#ifndef CUFFTDX_FFT_729_FP64_FWD_PTX_HPP
#define CUFFTDX_FFT_729_FP64_FWD_PTX_HPP



template<> __forceinline__ __device__ void cufftdx_private_function<523, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

asm volatile (R"({
.reg .b32 r<18>;
.reg .f64 fd<1850>;
.reg .b64 rd<9>;
mov.u32 r16, %tid.y;
mov.u32 r17, %54;
mad.lo.s32 r3, r16, 5832, r17;
add.f64 fd109, %74, %92;
add.f64 fd110, %56, fd109;
mul.f64 fd113, fd109, 0d3FE0000000000000;
sub.f64 fd114, %56, fd113;
add.f64 fd1841, %75, %93;
sub.f64 fd115, %75, %93;
mul.f64 fd116, fd115, 0d3FEBB67AE8584CAA;
add.f64 fd117, fd116, fd114;
sub.f64 fd118, fd114, fd116;
add.f64 fd1840, %57, fd1841;
mul.f64 fd119, fd1841, 0d3FE0000000000000;
sub.f64 fd120, %57, fd119;
sub.f64 fd121, %74, %92;
mul.f64 fd122, fd121, 0d3FEBB67AE8584CAA;
sub.f64 fd123, fd120, fd122;
add.f64 fd124, fd122, fd120;
add.f64 fd125, %80, %98;
add.f64 fd126, %62, fd125;
mul.f64 fd129, fd125, 0d3FE0000000000000;
sub.f64 fd130, %62, fd129;
add.f64 fd1839, %81, %99;
sub.f64 fd131, %81, %99;
mul.f64 fd132, fd131, 0d3FEBB67AE8584CAA;
add.f64 fd133, fd132, fd130;
sub.f64 fd134, fd130, fd132;
add.f64 fd1838, %63, fd1839;
mul.f64 fd135, fd1839, 0d3FE0000000000000;
sub.f64 fd136, %63, fd135;
sub.f64 fd137, %80, %98;
mul.f64 fd138, fd137, 0d3FEBB67AE8584CAA;
sub.f64 fd139, fd136, fd138;
add.f64 fd140, fd138, fd136;
add.f64 fd141, %86, %104;
add.f64 fd142, %68, fd141;
mul.f64 fd145, fd141, 0d3FE0000000000000;
sub.f64 fd146, %68, fd145;
add.f64 fd1837, %87, %105;
sub.f64 fd147, %87, %105;
mul.f64 fd148, fd147, 0d3FEBB67AE8584CAA;
add.f64 fd149, fd148, fd146;
sub.f64 fd150, fd146, fd148;
add.f64 fd1836, %69, fd1837;
mul.f64 fd151, fd1837, 0d3FE0000000000000;
sub.f64 fd152, %69, fd151;
sub.f64 fd153, %86, %104;
mul.f64 fd154, fd153, 0d3FEBB67AE8584CAA;
sub.f64 fd155, fd152, fd154;
add.f64 fd156, fd154, fd152;
mul.f64 fd158, fd139, 0dBFE491B7523C161D;
mul.f64 fd1835, fd133, 0d3FE8836FA2CF5039;
sub.f64 fd159, fd1835, fd158;
mul.f64 fd160, fd139, 0d3FE8836FA2CF5039;
fma.rn.f64 fd161, fd133, 0dBFE491B7523C161D, fd160;
mul.f64 fd1833, fd149, 0d3FC63A1A7E0B738A;
mul.f64 fd1834, fd155, 0dBFEF838B8C811C17;
sub.f64 fd164, fd1833, fd1834;
mul.f64 fd165, fd155, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd166, fd149, 0dBFEF838B8C811C17, fd165;
mul.f64 fd1831, fd134, 0d3FC63A1A7E0B738A;
mul.f64 fd1832, fd140, 0dBFEF838B8C811C17;
sub.f64 fd169, fd1831, fd1832;
mul.f64 fd170, fd140, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd171, fd134, 0dBFEF838B8C811C17, fd170;
mul.f64 fd1829, fd150, 0dBFEE11F642522D1C;
mul.f64 fd1830, fd156, 0dBFD5E3A8748A0BF5;
sub.f64 fd174, fd1829, fd1830;
mul.f64 fd175, fd156, 0dBFEE11F642522D1C;
fma.rn.f64 fd176, fd150, 0dBFD5E3A8748A0BF5, fd175;
add.f64 fd177, fd126, fd142;
add.f64 fd178, fd110, fd177;
mul.f64 fd181, fd177, 0d3FE0000000000000;
sub.f64 fd182, fd110, fd181;
add.f64 fd1828, fd1838, fd1836;
sub.f64 fd183, fd1838, fd1836;
mul.f64 fd184, fd183, 0d3FEBB67AE8584CAA;
add.f64 fd185, fd184, fd182;
sub.f64 fd186, fd182, fd184;
add.f64 fd1827, fd1840, fd1828;
mul.f64 fd187, fd1828, 0d3FE0000000000000;
sub.f64 fd188, fd1840, fd187;
sub.f64 fd189, fd126, fd142;
mul.f64 fd190, fd189, 0d3FEBB67AE8584CAA;
sub.f64 fd191, fd188, fd190;
add.f64 fd192, fd190, fd188;
add.f64 fd193, fd159, fd164;
add.f64 fd194, fd117, fd193;
mul.f64 fd197, fd193, 0d3FE0000000000000;
sub.f64 fd198, fd117, fd197;
add.f64 fd1826, fd161, fd166;
sub.f64 fd199, fd161, fd166;
mul.f64 fd200, fd199, 0d3FEBB67AE8584CAA;
add.f64 fd201, fd200, fd198;
sub.f64 fd202, fd198, fd200;
add.f64 fd1825, fd123, fd1826;
mul.f64 fd203, fd1826, 0d3FE0000000000000;
sub.f64 fd204, fd123, fd203;
sub.f64 fd205, fd159, fd164;
mul.f64 fd206, fd205, 0d3FEBB67AE8584CAA;
sub.f64 fd207, fd204, fd206;
add.f64 fd208, fd206, fd204;
add.f64 fd209, fd169, fd174;
add.f64 fd210, fd118, fd209;
mul.f64 fd213, fd209, 0d3FE0000000000000;
sub.f64 fd214, fd118, fd213;
add.f64 fd1824, fd171, fd176;
sub.f64 fd215, fd171, fd176;
mul.f64 fd216, fd215, 0d3FEBB67AE8584CAA;
add.f64 fd217, fd216, fd214;
sub.f64 fd218, fd214, fd216;
add.f64 fd1823, fd124, fd1824;
mul.f64 fd219, fd1824, 0d3FE0000000000000;
sub.f64 fd220, fd124, fd219;
sub.f64 fd221, fd169, fd174;
mul.f64 fd222, fd221, 0d3FEBB67AE8584CAA;
sub.f64 fd223, fd220, fd222;
add.f64 fd224, fd222, fd220;
add.f64 fd225, %76, %94;
add.f64 fd226, %58, fd225;
mul.f64 fd229, fd225, 0d3FE0000000000000;
sub.f64 fd230, %58, fd229;
add.f64 fd1820, %110, %111;
sub.f64 fd231, %110, %111;
mul.f64 fd232, fd231, 0d3FEBB67AE8584CAA;
add.f64 fd233, fd232, fd230;
sub.f64 fd234, fd230, fd232;
add.f64 fd1818, %112, fd1820;
mul.f64 fd235, fd1820, 0d3FE0000000000000;
sub.f64 fd236, %112, fd235;
sub.f64 fd237, %76, %94;
mul.f64 fd238, fd237, 0d3FEBB67AE8584CAA;
sub.f64 fd239, fd236, fd238;
add.f64 fd240, fd238, fd236;
add.f64 fd241, %82, %100;
add.f64 fd242, %64, fd241;
mul.f64 fd245, fd241, 0d3FE0000000000000;
sub.f64 fd246, %64, fd245;
add.f64 fd1815, %114, %113;
sub.f64 fd247, %114, %113;
mul.f64 fd248, fd247, 0d3FEBB67AE8584CAA;
add.f64 fd249, fd248, fd246;
sub.f64 fd250, fd246, fd248;
add.f64 fd1813, %115, fd1815;
mul.f64 fd251, fd1815, 0d3FE0000000000000;
sub.f64 fd252, %115, fd251;
sub.f64 fd253, %82, %100;
mul.f64 fd254, fd253, 0d3FEBB67AE8584CAA;
sub.f64 fd255, fd252, fd254;
add.f64 fd256, fd254, fd252;
add.f64 fd257, %88, %106;
add.f64 fd258, %70, fd257;
mul.f64 fd261, fd257, 0d3FE0000000000000;
sub.f64 fd262, %70, fd261;
add.f64 fd1810, %116, %117;
sub.f64 fd263, %116, %117;
mul.f64 fd264, fd263, 0d3FEBB67AE8584CAA;
add.f64 fd265, fd264, fd262;
sub.f64 fd266, fd262, fd264;
add.f64 fd1808, %118, fd1810;
mul.f64 fd267, fd1810, 0d3FE0000000000000;
sub.f64 fd268, %118, fd267;
sub.f64 fd269, %88, %106;
mul.f64 fd270, fd269, 0d3FEBB67AE8584CAA;
sub.f64 fd271, fd268, fd270;
add.f64 fd272, fd270, fd268;
mul.f64 fd274, fd255, 0dBFE491B7523C161D;
mul.f64 fd1807, fd249, 0d3FE8836FA2CF5039;
sub.f64 fd275, fd1807, fd274;
mul.f64 fd276, fd255, 0d3FE8836FA2CF5039;
fma.rn.f64 fd277, fd249, 0dBFE491B7523C161D, fd276;
mul.f64 fd279, fd271, 0dBFEF838B8C811C17;
mul.f64 fd1806, fd265, 0d3FC63A1A7E0B738A;
sub.f64 fd280, fd1806, fd279;
mul.f64 fd281, fd271, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd282, fd265, 0dBFEF838B8C811C17, fd281;
mul.f64 fd1804, fd250, 0d3FC63A1A7E0B738A;
mul.f64 fd1805, fd256, 0dBFEF838B8C811C17;
sub.f64 fd285, fd1804, fd1805;
mul.f64 fd286, fd256, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd287, fd250, 0dBFEF838B8C811C17, fd286;
mul.f64 fd1802, fd266, 0dBFEE11F642522D1C;
mul.f64 fd1803, fd272, 0dBFD5E3A8748A0BF5;
sub.f64 fd290, fd1802, fd1803;
mul.f64 fd291, fd272, 0dBFEE11F642522D1C;
fma.rn.f64 fd292, fd266, 0dBFD5E3A8748A0BF5, fd291;
add.f64 fd293, fd242, fd258;
add.f64 fd294, fd226, fd293;
mul.f64 fd297, fd293, 0d3FE0000000000000;
sub.f64 fd298, fd226, fd297;
add.f64 fd1801, fd1813, fd1808;
sub.f64 fd299, fd1813, fd1808;
mul.f64 fd300, fd299, 0d3FEBB67AE8584CAA;
add.f64 fd301, fd300, fd298;
sub.f64 fd302, fd298, fd300;
add.f64 fd1800, fd1818, fd1801;
mul.f64 fd303, fd1801, 0d3FE0000000000000;
sub.f64 fd304, fd1818, fd303;
sub.f64 fd305, fd242, fd258;
mul.f64 fd306, fd305, 0d3FEBB67AE8584CAA;
sub.f64 fd307, fd304, fd306;
add.f64 fd308, fd306, fd304;
add.f64 fd309, fd275, fd280;
add.f64 fd310, fd233, fd309;
mul.f64 fd313, fd309, 0d3FE0000000000000;
sub.f64 fd314, fd233, fd313;
add.f64 fd1799, fd277, fd282;
sub.f64 fd315, fd277, fd282;
mul.f64 fd316, fd315, 0d3FEBB67AE8584CAA;
add.f64 fd317, fd316, fd314;
sub.f64 fd318, fd314, fd316;
add.f64 fd1798, fd239, fd1799;
mul.f64 fd319, fd1799, 0d3FE0000000000000;
sub.f64 fd320, fd239, fd319;
sub.f64 fd321, fd275, fd280;
mul.f64 fd322, fd321, 0d3FEBB67AE8584CAA;
sub.f64 fd323, fd320, fd322;
add.f64 fd324, fd322, fd320;
add.f64 fd325, fd285, fd290;
add.f64 fd326, fd234, fd325;
mul.f64 fd329, fd325, 0d3FE0000000000000;
sub.f64 fd330, fd234, fd329;
add.f64 fd1797, fd287, fd292;
sub.f64 fd331, fd287, fd292;
mul.f64 fd332, fd331, 0d3FEBB67AE8584CAA;
add.f64 fd333, fd332, fd330;
sub.f64 fd334, fd330, fd332;
add.f64 fd1796, fd240, fd1797;
mul.f64 fd335, fd1797, 0d3FE0000000000000;
sub.f64 fd336, fd240, fd335;
sub.f64 fd337, fd285, fd290;
mul.f64 fd338, fd337, 0d3FEBB67AE8584CAA;
sub.f64 fd339, fd336, fd338;
add.f64 fd340, fd338, fd336;
add.f64 fd341, %78, %96;
add.f64 fd342, %60, fd341;
mul.f64 fd345, fd341, 0d3FE0000000000000;
sub.f64 fd346, %60, fd345;
add.f64 fd1793, %119, %120;
sub.f64 fd347, %119, %120;
mul.f64 fd348, fd347, 0d3FEBB67AE8584CAA;
add.f64 fd349, fd348, fd346;
sub.f64 fd350, fd346, fd348;
add.f64 fd1791, %121, fd1793;
mul.f64 fd351, fd1793, 0d3FE0000000000000;
sub.f64 fd352, %121, fd351;
sub.f64 fd353, %78, %96;
mul.f64 fd354, fd353, 0d3FEBB67AE8584CAA;
sub.f64 fd355, fd352, fd354;
add.f64 fd356, fd354, fd352;
add.f64 fd357, %84, %102;
add.f64 fd358, %66, fd357;
mul.f64 fd361, fd357, 0d3FE0000000000000;
sub.f64 fd362, %66, fd361;
add.f64 fd1788, %123, %122;
sub.f64 fd363, %123, %122;
mul.f64 fd364, fd363, 0d3FEBB67AE8584CAA;
add.f64 fd365, fd364, fd362;
sub.f64 fd366, fd362, fd364;
add.f64 fd1786, %124, fd1788;
mul.f64 fd367, fd1788, 0d3FE0000000000000;
sub.f64 fd368, %124, fd367;
sub.f64 fd369, %84, %102;
mul.f64 fd370, fd369, 0d3FEBB67AE8584CAA;
sub.f64 fd371, fd368, fd370;
add.f64 fd372, fd370, fd368;
add.f64 fd373, %90, %108;
add.f64 fd374, %72, fd373;
mul.f64 fd377, fd373, 0d3FE0000000000000;
sub.f64 fd378, %72, fd377;
add.f64 fd1784, %125, %109;
sub.f64 fd379, %125, %109;
mul.f64 fd380, fd379, 0d3FEBB67AE8584CAA;
add.f64 fd381, fd380, fd378;
sub.f64 fd382, fd378, fd380;
add.f64 fd1782, %126, fd1784;
mul.f64 fd383, fd1784, 0d3FE0000000000000;
sub.f64 fd384, %126, fd383;
sub.f64 fd385, %90, %108;
mul.f64 fd386, fd385, 0d3FEBB67AE8584CAA;
sub.f64 fd387, fd384, fd386;
add.f64 fd388, fd386, fd384;
mul.f64 fd390, fd371, 0dBFE491B7523C161D;
mul.f64 fd1781, fd365, 0d3FE8836FA2CF5039;
sub.f64 fd391, fd1781, fd390;
mul.f64 fd392, fd371, 0d3FE8836FA2CF5039;
fma.rn.f64 fd393, fd365, 0dBFE491B7523C161D, fd392;
mul.f64 fd395, fd387, 0dBFEF838B8C811C17;
mul.f64 fd1780, fd381, 0d3FC63A1A7E0B738A;
sub.f64 fd396, fd1780, fd395;
mul.f64 fd397, fd387, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd398, fd381, 0dBFEF838B8C811C17, fd397;
mul.f64 fd1778, fd366, 0d3FC63A1A7E0B738A;
mul.f64 fd1779, fd372, 0dBFEF838B8C811C17;
sub.f64 fd401, fd1778, fd1779;
mul.f64 fd402, fd372, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd403, fd366, 0dBFEF838B8C811C17, fd402;
mul.f64 fd1776, fd382, 0dBFEE11F642522D1C;
mul.f64 fd1777, fd388, 0dBFD5E3A8748A0BF5;
sub.f64 fd406, fd1776, fd1777;
mul.f64 fd407, fd388, 0dBFEE11F642522D1C;
fma.rn.f64 fd408, fd382, 0dBFD5E3A8748A0BF5, fd407;
add.f64 fd409, fd358, fd374;
add.f64 fd410, fd342, fd409;
mul.f64 fd413, fd409, 0d3FE0000000000000;
sub.f64 fd414, fd342, fd413;
add.f64 fd1775, fd1786, fd1782;
sub.f64 fd415, fd1786, fd1782;
mul.f64 fd416, fd415, 0d3FEBB67AE8584CAA;
add.f64 fd417, fd416, fd414;
sub.f64 fd418, fd414, fd416;
add.f64 fd1774, fd1791, fd1775;
mul.f64 fd419, fd1775, 0d3FE0000000000000;
sub.f64 fd420, fd1791, fd419;
sub.f64 fd421, fd358, fd374;
mul.f64 fd422, fd421, 0d3FEBB67AE8584CAA;
sub.f64 fd423, fd420, fd422;
add.f64 fd424, fd422, fd420;
add.f64 fd425, fd391, fd396;
add.f64 fd426, fd349, fd425;
mul.f64 fd429, fd425, 0d3FE0000000000000;
sub.f64 fd430, fd349, fd429;
add.f64 fd1773, fd393, fd398;
sub.f64 fd431, fd393, fd398;
mul.f64 fd432, fd431, 0d3FEBB67AE8584CAA;
add.f64 fd433, fd432, fd430;
sub.f64 fd434, fd430, fd432;
add.f64 fd1772, fd355, fd1773;
mul.f64 fd435, fd1773, 0d3FE0000000000000;
sub.f64 fd436, fd355, fd435;
sub.f64 fd437, fd391, fd396;
mul.f64 fd438, fd437, 0d3FEBB67AE8584CAA;
sub.f64 fd439, fd436, fd438;
add.f64 fd440, fd438, fd436;
add.f64 fd441, fd401, fd406;
add.f64 fd442, fd350, fd441;
mul.f64 fd445, fd441, 0d3FE0000000000000;
sub.f64 fd446, fd350, fd445;
add.f64 fd1771, fd403, fd408;
sub.f64 fd447, fd403, fd408;
mul.f64 fd448, fd447, 0d3FEBB67AE8584CAA;
add.f64 fd449, fd448, fd446;
sub.f64 fd450, fd446, fd448;
add.f64 fd1770, fd356, fd1771;
mul.f64 fd451, fd1771, 0d3FE0000000000000;
sub.f64 fd452, fd356, fd451;
sub.f64 fd453, fd401, fd406;
mul.f64 fd454, fd453, 0d3FEBB67AE8584CAA;
sub.f64 fd455, fd452, fd454;
add.f64 fd456, fd454, fd452;
mul.f64 fd458, fd1798, 0dBFCD84D223638000;
mul.f64 fd1769, fd310, 0d3FEF232EFF15C9E6;
sub.f64 fd459, fd1769, fd458;
mul.f64 fd460, fd1798, 0d3FEF232EFF15C9E6;
fma.rn.f64 fd461, fd310, 0dBFCD84D223638000, fd460;
mul.f64 fd1767, fd426, 0d3FEC98A37A9A7850;
mul.f64 fd1768, fd1772, 0dBFDCB920325BAFA6;
sub.f64 fd464, fd1767, fd1768;
mul.f64 fd465, fd1772, 0d3FEC98A37A9A7850;
fma.rn.f64 fd466, fd426, 0dBFDCB920325BAFA6, fd465;
mul.f64 fd1765, fd326, 0d3FEC98A37A9A7850;
mul.f64 fd1766, fd1796, 0dBFDCB920325BAFA6;
sub.f64 fd469, fd1765, fd1766;
mul.f64 fd470, fd1796, 0d3FEC98A37A9A7850;
fma.rn.f64 fd471, fd326, 0dBFDCB920325BAFA6, fd470;
mul.f64 fd1763, fd442, 0d3FE31BEC55BC71BC;
mul.f64 fd1764, fd1770, 0dBFE9AAFE4207DF5F;
sub.f64 fd474, fd1763, fd1764;
mul.f64 fd475, fd1770, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd476, fd442, 0dBFE9AAFE4207DF5F, fd475;
mul.f64 fd1761, fd301, 0d3FE8836FA2CF5039;
mul.f64 fd1762, fd307, 0dBFE491B7523C161D;
sub.f64 fd479, fd1761, fd1762;
mul.f64 fd480, fd307, 0d3FE8836FA2CF5039;
fma.rn.f64 fd481, fd301, 0dBFE491B7523C161D, fd480;
mul.f64 fd483, fd423, 0dBFEF838B8C811C17;
mul.f64 fd1760, fd417, 0d3FC63A1A7E0B738A;
sub.f64 fd484, fd1760, fd483;
mul.f64 fd485, fd423, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd486, fd417, 0dBFEF838B8C811C17, fd485;
mul.f64 fd488, fd323, 0dBFE9AAFE4207DF5F;
mul.f64 fd1759, fd317, 0d3FE31BEC55BC71BC;
sub.f64 fd489, fd1759, fd488;
mul.f64 fd490, fd323, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd491, fd317, 0dBFE9AAFE4207DF5F, fd490;
mul.f64 fd493, fd439, 0dBFEEA7D99F29CADE;
mul.f64 fd1758, fd433, 0dBFD25AFBF23865BF;
sub.f64 fd494, fd1758, fd493;
mul.f64 fd495, fd439, 0dBFD25AFBF23865BF;
fma.rn.f64 fd496, fd433, 0dBFEEA7D99F29CADE, fd495;
mul.f64 fd498, fd339, 0dBFED6206BEB6C24B;
mul.f64 fd1757, fd333, 0d3FD9595EF26FB670;
sub.f64 fd499, fd1757, fd498;
mul.f64 fd500, fd339, 0d3FD9595EF26FB670;
fma.rn.f64 fd501, fd333, 0dBFED6206BEB6C24B, fd500;
mul.f64 fd503, fd455, 0dBFE746A51650EADE;
mul.f64 fd1756, fd449, 0dBFE5F5B105F99707;
sub.f64 fd504, fd1756, fd503;
mul.f64 fd505, fd455, 0dBFE5F5B105F99707;
fma.rn.f64 fd506, fd449, 0dBFE746A51650EADE, fd505;
mul.f64 fd508, fd308, 0dBFEF838B8C811C17;
mul.f64 fd1755, fd302, 0d3FC63A1A7E0B738A;
sub.f64 fd509, fd1755, fd508;
mul.f64 fd510, fd308, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd511, fd302, 0dBFEF838B8C811C17, fd510;
mul.f64 fd1753, fd418, 0dBFEE11F642522D1C;
mul.f64 fd1754, fd424, 0dBFD5E3A8748A0BF5;
sub.f64 fd514, fd1753, fd1754;
mul.f64 fd515, fd424, 0dBFEE11F642522D1C;
fma.rn.f64 fd516, fd418, 0dBFD5E3A8748A0BF5, fd515;
mul.f64 fd1751, fd318, 0dBFADC528B5343A86;
mul.f64 fd1752, fd324, 0dBFEFF223F3635CE3;
sub.f64 fd519, fd1751, fd1752;
mul.f64 fd520, fd324, 0dBFADC528B5343A86;
fma.rn.f64 fd521, fd318, 0dBFEFF223F3635CE3, fd520;
mul.f64 fd1749, fd434, 0dBFEFC89BCEF44CF4;
mul.f64 fd1750, fd440, 0d3FBDB843E577175E;
sub.f64 fd524, fd1749, fd1750;
mul.f64 fd525, fd440, 0dBFEFC89BCEF44CF4;
fma.rn.f64 fd526, fd434, 0d3FBDB843E577175E, fd525;
mul.f64 fd528, fd340, 0dBFEEA7D99F29CADE;
mul.f64 fd1748, fd334, 0dBFD25AFBF23865BF;
sub.f64 fd529, fd1748, fd528;
mul.f64 fd530, fd340, 0dBFD25AFBF23865BF;
fma.rn.f64 fd531, fd334, 0dBFEEA7D99F29CADE, fd530;
mul.f64 fd533, fd456, 0d3FE19593DA358510;
mul.f64 fd1747, fd450, 0dBFEABC50EF4734A7;
sub.f64 fd534, fd1747, fd533;
mul.f64 fd535, fd456, 0dBFEABC50EF4734A7;
fma.rn.f64 fd536, fd450, 0d3FE19593DA358510, fd535;
add.f64 fd537, fd294, fd410;
add.f64 fd538, fd178, fd537;
mul.f64 fd541, fd537, 0d3FE0000000000000;
sub.f64 fd542, fd178, fd541;
add.f64 fd1746, fd1800, fd1774;
sub.f64 fd543, fd1800, fd1774;
mul.f64 fd544, fd543, 0d3FEBB67AE8584CAA;
add.f64 fd545, fd544, fd542;
sub.f64 fd546, fd542, fd544;
add.f64 fd1745, fd1827, fd1746;
mul.f64 fd547, fd1746, 0d3FE0000000000000;
sub.f64 fd548, fd1827, fd547;
sub.f64 fd549, fd294, fd410;
mul.f64 fd550, fd549, 0d3FEBB67AE8584CAA;
sub.f64 fd551, fd548, fd550;
add.f64 fd552, fd550, fd548;
add.f64 fd553, fd459, fd464;
add.f64 fd554, fd194, fd553;
mul.f64 fd557, fd553, 0d3FE0000000000000;
sub.f64 fd558, fd194, fd557;
add.f64 fd1744, fd461, fd466;
sub.f64 fd559, fd461, fd466;
mul.f64 fd560, fd559, 0d3FEBB67AE8584CAA;
add.f64 fd561, fd560, fd558;
sub.f64 fd562, fd558, fd560;
add.f64 fd1743, fd1825, fd1744;
mul.f64 fd563, fd1744, 0d3FE0000000000000;
sub.f64 fd564, fd1825, fd563;
sub.f64 fd565, fd459, fd464;
mul.f64 fd566, fd565, 0d3FEBB67AE8584CAA;
sub.f64 fd567, fd564, fd566;
add.f64 fd568, fd566, fd564;
add.f64 fd569, fd469, fd474;
add.f64 fd570, fd210, fd569;
mul.f64 fd573, fd569, 0d3FE0000000000000;
sub.f64 fd574, fd210, fd573;
add.f64 fd1742, fd471, fd476;
sub.f64 fd575, fd471, fd476;
mul.f64 fd576, fd575, 0d3FEBB67AE8584CAA;
add.f64 fd577, fd576, fd574;
sub.f64 fd578, fd574, fd576;
add.f64 fd1741, fd1823, fd1742;
mul.f64 fd579, fd1742, 0d3FE0000000000000;
sub.f64 fd580, fd1823, fd579;
sub.f64 fd581, fd469, fd474;
mul.f64 fd582, fd581, 0d3FEBB67AE8584CAA;
sub.f64 fd583, fd580, fd582;
add.f64 fd584, fd582, fd580;
add.f64 fd585, fd479, fd484;
add.f64 fd586, fd185, fd585;
mul.f64 fd589, fd585, 0d3FE0000000000000;
sub.f64 fd590, fd185, fd589;
add.f64 fd1740, fd481, fd486;
sub.f64 fd591, fd481, fd486;
mul.f64 fd592, fd591, 0d3FEBB67AE8584CAA;
add.f64 fd593, fd592, fd590;
sub.f64 fd594, fd590, fd592;
add.f64 fd1739, fd191, fd1740;
mul.f64 fd595, fd1740, 0d3FE0000000000000;
sub.f64 fd596, fd191, fd595;
sub.f64 fd597, fd479, fd484;
mul.f64 fd598, fd597, 0d3FEBB67AE8584CAA;
sub.f64 fd599, fd596, fd598;
add.f64 fd600, fd598, fd596;
add.f64 fd601, fd489, fd494;
add.f64 fd602, fd201, fd601;
mul.f64 fd605, fd601, 0d3FE0000000000000;
sub.f64 fd606, fd201, fd605;
add.f64 fd1738, fd491, fd496;
sub.f64 fd607, fd491, fd496;
mul.f64 fd608, fd607, 0d3FEBB67AE8584CAA;
add.f64 fd609, fd608, fd606;
sub.f64 fd610, fd606, fd608;
add.f64 fd1737, fd207, fd1738;
mul.f64 fd611, fd1738, 0d3FE0000000000000;
sub.f64 fd612, fd207, fd611;
sub.f64 fd613, fd489, fd494;
mul.f64 fd614, fd613, 0d3FEBB67AE8584CAA;
sub.f64 fd615, fd612, fd614;
add.f64 fd616, fd614, fd612;
add.f64 fd617, fd499, fd504;
add.f64 fd618, fd217, fd617;
mul.f64 fd621, fd617, 0d3FE0000000000000;
sub.f64 fd622, fd217, fd621;
add.f64 fd1736, fd501, fd506;
sub.f64 fd623, fd501, fd506;
mul.f64 fd624, fd623, 0d3FEBB67AE8584CAA;
add.f64 fd625, fd624, fd622;
sub.f64 fd626, fd622, fd624;
add.f64 fd1735, fd223, fd1736;
mul.f64 fd627, fd1736, 0d3FE0000000000000;
sub.f64 fd628, fd223, fd627;
sub.f64 fd629, fd499, fd504;
mul.f64 fd630, fd629, 0d3FEBB67AE8584CAA;
sub.f64 fd631, fd628, fd630;
add.f64 fd632, fd630, fd628;
add.f64 fd633, fd509, fd514;
add.f64 fd634, fd186, fd633;
mul.f64 fd637, fd633, 0d3FE0000000000000;
sub.f64 fd638, fd186, fd637;
add.f64 fd1734, fd511, fd516;
sub.f64 fd639, fd511, fd516;
mul.f64 fd640, fd639, 0d3FEBB67AE8584CAA;
add.f64 fd641, fd640, fd638;
sub.f64 fd642, fd638, fd640;
add.f64 fd1733, fd192, fd1734;
mul.f64 fd643, fd1734, 0d3FE0000000000000;
sub.f64 fd644, fd192, fd643;
sub.f64 fd645, fd509, fd514;
mul.f64 fd646, fd645, 0d3FEBB67AE8584CAA;
sub.f64 fd647, fd644, fd646;
add.f64 fd648, fd646, fd644;
add.f64 fd649, fd519, fd524;
add.f64 fd650, fd202, fd649;
mul.f64 fd653, fd649, 0d3FE0000000000000;
sub.f64 fd654, fd202, fd653;
add.f64 fd1732, fd521, fd526;
sub.f64 fd655, fd521, fd526;
mul.f64 fd656, fd655, 0d3FEBB67AE8584CAA;
add.f64 fd657, fd656, fd654;
sub.f64 fd658, fd654, fd656;
add.f64 fd1731, fd208, fd1732;
mul.f64 fd659, fd1732, 0d3FE0000000000000;
sub.f64 fd660, fd208, fd659;
sub.f64 fd661, fd519, fd524;
mul.f64 fd662, fd661, 0d3FEBB67AE8584CAA;
sub.f64 fd663, fd660, fd662;
add.f64 fd664, fd662, fd660;
add.f64 fd665, fd529, fd534;
add.f64 fd666, fd218, fd665;
mul.f64 fd669, fd665, 0d3FE0000000000000;
sub.f64 fd670, fd218, fd669;
add.f64 fd1730, fd531, fd536;
sub.f64 fd671, fd531, fd536;
mul.f64 fd672, fd671, 0d3FEBB67AE8584CAA;
add.f64 fd673, fd672, fd670;
sub.f64 fd674, fd670, fd672;
add.f64 fd1729, fd224, fd1730;
mul.f64 fd675, fd1730, 0d3FE0000000000000;
sub.f64 fd676, fd224, fd675;
sub.f64 fd677, fd529, fd534;
mul.f64 fd678, fd677, 0d3FEBB67AE8584CAA;
sub.f64 fd679, fd676, fd678;
add.f64 fd680, fd678, fd676;
mov.u32 r15, %tid.x;
mul.wide.u32 rd2, r15, 795364315;
shr.u64 rd3, rd2, 32;
cvt.u32.u64 r5, rd3;
sub.s32 r6, r15, r5;
shr.u32 r7, r6, 1;
add.s32 r8, r7, r5;
shr.u32 r9, r8, 4;
mul.lo.s32 r10, r9, 27;
sub.s32 r11, r15, r10;
mul.wide.u32 rd7, r11, 16;
mov.u64 rd8, %55;
add.s64 rd6, rd8, rd7;
ld.global.v2.f64 {fd681, fd682}, [rd6];
mul.f64 fd1727, fd681, fd554;
mul.f64 fd1728, fd682, fd1743;
sub.f64 fd687, fd1727, fd1728;
mul.f64 fd688, fd681, fd1743;
fma.rn.f64 fd689, fd682, fd554, fd688;
mul.f64 fd1725, fd681, fd681;
mul.f64 fd1726, fd682, fd682;
sub.f64 fd692, fd1725, fd1726;
mul.f64 fd693, fd682, fd681;
fma.rn.f64 fd694, fd682, fd681, fd693;
mul.f64 fd1723, fd692, fd570;
mul.f64 fd1724, fd694, fd1741;
sub.f64 fd697, fd1723, fd1724;
mul.f64 fd698, fd692, fd1741;
fma.rn.f64 fd699, fd694, fd570, fd698;
mul.f64 fd701, fd682, fd694;
mul.f64 fd1722, fd681, fd692;
sub.f64 fd702, fd1722, fd701;
mul.f64 fd703, fd681, fd694;
fma.rn.f64 fd704, fd682, fd692, fd703;
mul.f64 fd706, fd704, fd1739;
mul.f64 fd1721, fd702, fd586;
sub.f64 fd707, fd1721, fd706;
mul.f64 fd708, fd702, fd1739;
fma.rn.f64 fd709, fd704, fd586, fd708;
mul.f64 fd711, fd682, fd704;
mul.f64 fd1720, fd681, fd702;
sub.f64 fd712, fd1720, fd711;
mul.f64 fd713, fd681, fd704;
fma.rn.f64 fd714, fd682, fd702, fd713;
mul.f64 fd716, fd714, fd1737;
mul.f64 fd1719, fd712, fd602;
sub.f64 fd717, fd1719, fd716;
mul.f64 fd718, fd712, fd1737;
fma.rn.f64 fd719, fd714, fd602, fd718;
mul.f64 fd721, fd682, fd714;
mul.f64 fd1718, fd681, fd712;
sub.f64 fd722, fd1718, fd721;
mul.f64 fd723, fd681, fd714;
fma.rn.f64 fd724, fd682, fd712, fd723;
mul.f64 fd1716, fd722, fd618;
mul.f64 fd1717, fd724, fd1735;
sub.f64 fd727, fd1716, fd1717;
mul.f64 fd728, fd722, fd1735;
fma.rn.f64 fd729, fd724, fd618, fd728;
mul.f64 fd1714, fd681, fd722;
mul.f64 fd1715, fd682, fd724;
sub.f64 fd732, fd1714, fd1715;
mul.f64 fd733, fd681, fd724;
fma.rn.f64 fd734, fd682, fd722, fd733;
mul.f64 fd1712, fd732, fd634;
mul.f64 fd1713, fd734, fd1733;
sub.f64 fd737, fd1712, fd1713;
mul.f64 fd738, fd732, fd1733;
fma.rn.f64 fd739, fd734, fd634, fd738;
mul.f64 fd1710, fd681, fd732;
mul.f64 fd1711, fd682, fd734;
sub.f64 fd742, fd1710, fd1711;
mul.f64 fd743, fd681, fd734;
fma.rn.f64 fd744, fd682, fd732, fd743;
mul.f64 fd746, fd744, fd1731;
mul.f64 fd1709, fd742, fd650;
sub.f64 fd747, fd1709, fd746;
mul.f64 fd748, fd742, fd1731;
fma.rn.f64 fd749, fd744, fd650, fd748;
mul.f64 fd751, fd682, fd744;
mul.f64 fd1708, fd681, fd742;
sub.f64 fd752, fd1708, fd751;
mul.f64 fd753, fd681, fd744;
fma.rn.f64 fd754, fd682, fd742, fd753;
mul.f64 fd756, fd754, fd1729;
mul.f64 fd1707, fd752, fd666;
sub.f64 fd757, fd1707, fd756;
mul.f64 fd758, fd752, fd1729;
fma.rn.f64 fd759, fd754, fd666, fd758;
mul.f64 fd761, fd682, fd754;
mul.f64 fd1706, fd681, fd752;
sub.f64 fd762, fd1706, fd761;
mul.f64 fd763, fd681, fd754;
fma.rn.f64 fd764, fd682, fd752, fd763;
mul.f64 fd766, fd764, fd551;
mul.f64 fd1705, fd762, fd545;
sub.f64 fd767, fd1705, fd766;
mul.f64 fd768, fd762, fd551;
fma.rn.f64 fd769, fd764, fd545, fd768;
mul.f64 fd1703, fd681, fd762;
mul.f64 fd1704, fd682, fd764;
sub.f64 fd772, fd1703, fd1704;
mul.f64 fd773, fd681, fd764;
fma.rn.f64 fd774, fd682, fd762, fd773;
mul.f64 fd1701, fd772, fd561;
mul.f64 fd1702, fd774, fd567;
sub.f64 fd777, fd1701, fd1702;
mul.f64 fd778, fd772, fd567;
fma.rn.f64 fd779, fd774, fd561, fd778;
mul.f64 fd1699, fd681, fd772;
mul.f64 fd1700, fd682, fd774;
sub.f64 fd782, fd1699, fd1700;
mul.f64 fd783, fd681, fd774;
fma.rn.f64 fd784, fd682, fd772, fd783;
mul.f64 fd1697, fd782, fd577;
mul.f64 fd1698, fd784, fd583;
sub.f64 fd787, fd1697, fd1698;
mul.f64 fd788, fd782, fd583;
fma.rn.f64 fd789, fd784, fd577, fd788;
mul.f64 fd791, fd682, fd784;
mul.f64 fd1696, fd681, fd782;
sub.f64 fd792, fd1696, fd791;
mul.f64 fd793, fd681, fd784;
fma.rn.f64 fd794, fd682, fd782, fd793;
mul.f64 fd796, fd794, fd599;
mul.f64 fd1695, fd792, fd593;
sub.f64 fd797, fd1695, fd796;
mul.f64 fd798, fd792, fd599;
fma.rn.f64 fd799, fd794, fd593, fd798;
mul.f64 fd801, fd682, fd794;
mul.f64 fd1694, fd681, fd792;
sub.f64 fd802, fd1694, fd801;
mul.f64 fd803, fd681, fd794;
fma.rn.f64 fd804, fd682, fd792, fd803;
mul.f64 fd806, fd804, fd615;
mul.f64 fd1693, fd802, fd609;
sub.f64 fd807, fd1693, fd806;
mul.f64 fd808, fd802, fd615;
fma.rn.f64 fd809, fd804, fd609, fd808;
ld.global.v2.f64 {fd810, fd811}, [rd6+432];
mul.f64 fd815, fd811, fd631;
mul.f64 fd1692, fd810, fd625;
sub.f64 fd816, fd1692, fd815;
mul.f64 fd817, fd810, fd631;
fma.rn.f64 fd818, fd811, fd625, fd817;
mul.f64 fd820, fd682, fd811;
mul.f64 fd1691, fd681, fd810;
sub.f64 fd821, fd1691, fd820;
mul.f64 fd822, fd681, fd811;
fma.rn.f64 fd823, fd682, fd810, fd822;
mul.f64 fd825, fd823, fd647;
mul.f64 fd1690, fd821, fd641;
sub.f64 fd826, fd1690, fd825;
mul.f64 fd827, fd821, fd647;
fma.rn.f64 fd828, fd823, fd641, fd827;
mul.f64 fd830, fd682, fd823;
mul.f64 fd1689, fd681, fd821;
sub.f64 fd831, fd1689, fd830;
mul.f64 fd832, fd681, fd823;
fma.rn.f64 fd833, fd682, fd821, fd832;
mul.f64 fd1687, fd831, fd657;
mul.f64 fd1688, fd833, fd663;
sub.f64 fd836, fd1687, fd1688;
mul.f64 fd837, fd831, fd663;
fma.rn.f64 fd838, fd833, fd657, fd837;
mul.f64 fd1685, fd681, fd831;
mul.f64 fd1686, fd682, fd833;
sub.f64 fd841, fd1685, fd1686;
mul.f64 fd842, fd681, fd833;
fma.rn.f64 fd843, fd682, fd831, fd842;
mul.f64 fd1683, fd841, fd673;
mul.f64 fd1684, fd843, fd679;
sub.f64 fd846, fd1683, fd1684;
mul.f64 fd847, fd841, fd679;
fma.rn.f64 fd848, fd843, fd673, fd847;
mul.f64 fd1681, fd681, fd841;
mul.f64 fd1682, fd682, fd843;
sub.f64 fd851, fd1681, fd1682;
mul.f64 fd852, fd681, fd843;
fma.rn.f64 fd853, fd682, fd841, fd852;
mul.f64 fd855, fd853, fd552;
mul.f64 fd1680, fd851, fd546;
sub.f64 fd856, fd1680, fd855;
mul.f64 fd857, fd851, fd552;
fma.rn.f64 fd858, fd853, fd546, fd857;
mul.f64 fd860, fd682, fd853;
mul.f64 fd1679, fd681, fd851;
sub.f64 fd861, fd1679, fd860;
mul.f64 fd862, fd681, fd853;
fma.rn.f64 fd863, fd682, fd851, fd862;
mul.f64 fd865, fd863, fd568;
mul.f64 fd1678, fd861, fd562;
sub.f64 fd866, fd1678, fd865;
mul.f64 fd867, fd861, fd568;
fma.rn.f64 fd868, fd863, fd562, fd867;
mul.f64 fd870, fd682, fd863;
mul.f64 fd1677, fd681, fd861;
sub.f64 fd871, fd1677, fd870;
mul.f64 fd872, fd681, fd863;
fma.rn.f64 fd873, fd682, fd861, fd872;
mul.f64 fd875, fd873, fd584;
mul.f64 fd1676, fd871, fd578;
sub.f64 fd876, fd1676, fd875;
mul.f64 fd877, fd871, fd584;
fma.rn.f64 fd878, fd873, fd578, fd877;
mul.f64 fd880, fd682, fd873;
mul.f64 fd1675, fd681, fd871;
sub.f64 fd881, fd1675, fd880;
mul.f64 fd882, fd681, fd873;
fma.rn.f64 fd883, fd682, fd871, fd882;
mul.f64 fd1673, fd881, fd594;
mul.f64 fd1674, fd883, fd600;
sub.f64 fd886, fd1673, fd1674;
mul.f64 fd887, fd881, fd600;
fma.rn.f64 fd888, fd883, fd594, fd887;
mul.f64 fd1671, fd681, fd881;
mul.f64 fd1672, fd682, fd883;
sub.f64 fd891, fd1671, fd1672;
mul.f64 fd892, fd681, fd883;
fma.rn.f64 fd893, fd682, fd881, fd892;
mul.f64 fd1669, fd891, fd610;
mul.f64 fd1670, fd893, fd616;
sub.f64 fd896, fd1669, fd1670;
mul.f64 fd897, fd891, fd616;
fma.rn.f64 fd898, fd893, fd610, fd897;
mul.f64 fd900, fd682, fd893;
mul.f64 fd1668, fd681, fd891;
sub.f64 fd901, fd1668, fd900;
mul.f64 fd902, fd681, fd893;
fma.rn.f64 fd903, fd682, fd891, fd902;
mul.f64 fd905, fd903, fd632;
mul.f64 fd1667, fd901, fd626;
sub.f64 fd906, fd1667, fd905;
mul.f64 fd907, fd901, fd632;
fma.rn.f64 fd908, fd903, fd626, fd907;
mul.f64 fd910, fd682, fd903;
mul.f64 fd1666, fd681, fd901;
sub.f64 fd911, fd1666, fd910;
mul.f64 fd912, fd681, fd903;
fma.rn.f64 fd913, fd682, fd901, fd912;
mul.f64 fd915, fd913, fd648;
mul.f64 fd1665, fd911, fd642;
sub.f64 fd916, fd1665, fd915;
mul.f64 fd917, fd911, fd648;
fma.rn.f64 fd918, fd913, fd642, fd917;
mul.f64 fd920, fd682, fd913;
mul.f64 fd1664, fd681, fd911;
sub.f64 fd921, fd1664, fd920;
mul.f64 fd922, fd681, fd913;
fma.rn.f64 fd923, fd682, fd911, fd922;
mul.f64 fd925, fd923, fd664;
mul.f64 fd1663, fd921, fd658;
sub.f64 fd926, fd1663, fd925;
mul.f64 fd927, fd921, fd664;
fma.rn.f64 fd928, fd923, fd658, fd927;
mul.f64 fd1661, fd681, fd921;
mul.f64 fd1662, fd682, fd923;
sub.f64 fd931, fd1661, fd1662;
mul.f64 fd932, fd681, fd923;
fma.rn.f64 fd933, fd682, fd921, fd932;
mul.f64 fd1659, fd931, fd674;
mul.f64 fd1660, fd933, fd680;
sub.f64 fd936, fd1659, fd1660;
mul.f64 fd937, fd931, fd680;
fma.rn.f64 fd938, fd933, fd674, fd937;
mad.lo.s32 r12, r9, 5832, r3;
barrier.sync 0;
mad.lo.s32 r13, r11, 216, r12;
st.shared.f64 [r13], fd538;
st.shared.f64 [r13+8], fd687;
st.shared.f64 [r13+16], fd697;
st.shared.f64 [r13+24], fd707;
st.shared.f64 [r13+32], fd717;
st.shared.f64 [r13+40], fd727;
st.shared.f64 [r13+48], fd737;
st.shared.f64 [r13+56], fd747;
st.shared.f64 [r13+64], fd757;
st.shared.f64 [r13+72], fd767;
st.shared.f64 [r13+80], fd777;
st.shared.f64 [r13+88], fd787;
st.shared.f64 [r13+96], fd797;
st.shared.f64 [r13+104], fd807;
st.shared.f64 [r13+112], fd816;
st.shared.f64 [r13+120], fd826;
st.shared.f64 [r13+128], fd836;
st.shared.f64 [r13+136], fd846;
st.shared.f64 [r13+144], fd856;
st.shared.f64 [r13+152], fd866;
st.shared.f64 [r13+160], fd876;
st.shared.f64 [r13+168], fd886;
st.shared.f64 [r13+176], fd896;
st.shared.f64 [r13+184], fd906;
st.shared.f64 [r13+192], fd916;
st.shared.f64 [r13+200], fd926;
st.shared.f64 [r13+208], fd936;
barrier.sync 0;
mad.lo.s32 r14, r11, -208, r13;
ld.shared.f64 fd939, [r14];
ld.shared.f64 fd940, [r14+216];
ld.shared.f64 fd941, [r14+432];
ld.shared.f64 fd942, [r14+648];
ld.shared.f64 fd943, [r14+864];
ld.shared.f64 fd944, [r14+1080];
ld.shared.f64 fd945, [r14+1296];
ld.shared.f64 fd946, [r14+1512];
ld.shared.f64 fd947, [r14+1728];
ld.shared.f64 fd948, [r14+1944];
ld.shared.f64 fd949, [r14+2160];
ld.shared.f64 fd950, [r14+2376];
ld.shared.f64 fd951, [r14+2592];
ld.shared.f64 fd952, [r14+2808];
ld.shared.f64 fd953, [r14+3024];
ld.shared.f64 fd954, [r14+3240];
ld.shared.f64 fd955, [r14+3456];
ld.shared.f64 fd956, [r14+3672];
ld.shared.f64 fd957, [r14+3888];
ld.shared.f64 fd958, [r14+4104];
ld.shared.f64 fd959, [r14+4320];
ld.shared.f64 fd960, [r14+4536];
ld.shared.f64 fd961, [r14+4752];
ld.shared.f64 fd962, [r14+4968];
ld.shared.f64 fd963, [r14+5184];
ld.shared.f64 fd964, [r14+5400];
ld.shared.f64 fd965, [r14+5616];
barrier.sync 0;
st.shared.f64 [r13], fd1745;
st.shared.f64 [r13+8], fd689;
st.shared.f64 [r13+16], fd699;
st.shared.f64 [r13+24], fd709;
st.shared.f64 [r13+32], fd719;
st.shared.f64 [r13+40], fd729;
st.shared.f64 [r13+48], fd739;
st.shared.f64 [r13+56], fd749;
st.shared.f64 [r13+64], fd759;
st.shared.f64 [r13+72], fd769;
st.shared.f64 [r13+80], fd779;
st.shared.f64 [r13+88], fd789;
st.shared.f64 [r13+96], fd799;
st.shared.f64 [r13+104], fd809;
st.shared.f64 [r13+112], fd818;
st.shared.f64 [r13+120], fd828;
st.shared.f64 [r13+128], fd838;
st.shared.f64 [r13+136], fd848;
st.shared.f64 [r13+144], fd858;
st.shared.f64 [r13+152], fd868;
st.shared.f64 [r13+160], fd878;
st.shared.f64 [r13+168], fd888;
st.shared.f64 [r13+176], fd898;
st.shared.f64 [r13+184], fd908;
st.shared.f64 [r13+192], fd918;
st.shared.f64 [r13+200], fd928;
st.shared.f64 [r13+208], fd938;
barrier.sync 0;
ld.shared.f64 fd966, [r14];
ld.shared.f64 fd967, [r14+216];
ld.shared.f64 fd968, [r14+432];
ld.shared.f64 fd969, [r14+648];
ld.shared.f64 fd970, [r14+864];
ld.shared.f64 fd971, [r14+1080];
ld.shared.f64 fd972, [r14+1296];
ld.shared.f64 fd973, [r14+1512];
ld.shared.f64 fd974, [r14+1728];
ld.shared.f64 fd975, [r14+1944];
ld.shared.f64 fd976, [r14+2160];
ld.shared.f64 fd977, [r14+2376];
ld.shared.f64 fd978, [r14+2592];
ld.shared.f64 fd979, [r14+2808];
ld.shared.f64 fd980, [r14+3024];
ld.shared.f64 fd981, [r14+3240];
ld.shared.f64 fd982, [r14+3456];
ld.shared.f64 fd983, [r14+3672];
ld.shared.f64 fd984, [r14+3888];
ld.shared.f64 fd985, [r14+4104];
ld.shared.f64 fd986, [r14+4320];
ld.shared.f64 fd987, [r14+4536];
ld.shared.f64 fd988, [r14+4752];
ld.shared.f64 fd989, [r14+4968];
ld.shared.f64 fd990, [r14+5184];
ld.shared.f64 fd991, [r14+5400];
ld.shared.f64 fd992, [r14+5616];
add.f64 fd993, fd948, fd957;
add.f64 fd994, fd939, fd993;
mul.f64 fd997, fd993, 0d3FE0000000000000;
sub.f64 fd998, fd939, fd997;
add.f64 fd1658, fd975, fd984;
sub.f64 fd999, fd975, fd984;
mul.f64 fd1000, fd999, 0d3FEBB67AE8584CAA;
add.f64 fd1001, fd1000, fd998;
sub.f64 fd1002, fd998, fd1000;
add.f64 fd1657, fd966, fd1658;
mul.f64 fd1003, fd1658, 0d3FE0000000000000;
sub.f64 fd1004, fd966, fd1003;
sub.f64 fd1005, fd948, fd957;
mul.f64 fd1006, fd1005, 0d3FEBB67AE8584CAA;
sub.f64 fd1007, fd1004, fd1006;
add.f64 fd1008, fd1006, fd1004;
add.f64 fd1009, fd951, fd960;
add.f64 fd1010, fd942, fd1009;
mul.f64 fd1013, fd1009, 0d3FE0000000000000;
sub.f64 fd1014, fd942, fd1013;
add.f64 fd1656, fd978, fd987;
sub.f64 fd1015, fd978, fd987;
mul.f64 fd1016, fd1015, 0d3FEBB67AE8584CAA;
add.f64 fd1017, fd1016, fd1014;
sub.f64 fd1018, fd1014, fd1016;
add.f64 fd1655, fd969, fd1656;
mul.f64 fd1019, fd1656, 0d3FE0000000000000;
sub.f64 fd1020, fd969, fd1019;
sub.f64 fd1021, fd951, fd960;
mul.f64 fd1022, fd1021, 0d3FEBB67AE8584CAA;
sub.f64 fd1023, fd1020, fd1022;
add.f64 fd1024, fd1022, fd1020;
add.f64 fd1025, fd954, fd963;
add.f64 fd1026, fd945, fd1025;
mul.f64 fd1029, fd1025, 0d3FE0000000000000;
sub.f64 fd1030, fd945, fd1029;
add.f64 fd1654, fd981, fd990;
sub.f64 fd1031, fd981, fd990;
mul.f64 fd1032, fd1031, 0d3FEBB67AE8584CAA;
add.f64 fd1033, fd1032, fd1030;
sub.f64 fd1034, fd1030, fd1032;
add.f64 fd1653, fd972, fd1654;
mul.f64 fd1035, fd1654, 0d3FE0000000000000;
sub.f64 fd1036, fd972, fd1035;
sub.f64 fd1037, fd954, fd963;
mul.f64 fd1038, fd1037, 0d3FEBB67AE8584CAA;
sub.f64 fd1039, fd1036, fd1038;
add.f64 fd1040, fd1038, fd1036;
mul.f64 fd1042, fd1023, 0dBFE491B7523C161D;
mul.f64 fd1652, fd1017, 0d3FE8836FA2CF5039;
sub.f64 fd1043, fd1652, fd1042;
mul.f64 fd1044, fd1023, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1045, fd1017, 0dBFE491B7523C161D, fd1044;
mul.f64 fd1047, fd1039, 0dBFEF838B8C811C17;
mul.f64 fd1651, fd1033, 0d3FC63A1A7E0B738A;
sub.f64 fd1048, fd1651, fd1047;
mul.f64 fd1049, fd1039, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1050, fd1033, 0dBFEF838B8C811C17, fd1049;
mul.f64 fd1052, fd1024, 0dBFEF838B8C811C17;
mul.f64 fd1650, fd1018, 0d3FC63A1A7E0B738A;
sub.f64 fd1053, fd1650, fd1052;
mul.f64 fd1054, fd1024, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1055, fd1018, 0dBFEF838B8C811C17, fd1054;
mul.f64 fd1057, fd1040, 0dBFD5E3A8748A0BF5;
mul.f64 fd1649, fd1034, 0dBFEE11F642522D1C;
sub.f64 fd1058, fd1649, fd1057;
mul.f64 fd1059, fd1040, 0dBFEE11F642522D1C;
fma.rn.f64 fd1060, fd1034, 0dBFD5E3A8748A0BF5, fd1059;
add.f64 fd1061, fd1010, fd1026;
add.f64 fd1062, fd994, fd1061;
mul.f64 fd1065, fd1061, 0d3FE0000000000000;
sub.f64 fd1066, fd994, fd1065;
add.f64 fd1648, fd1655, fd1653;
sub.f64 fd1067, fd1655, fd1653;
mul.f64 fd1068, fd1067, 0d3FEBB67AE8584CAA;
add.f64 fd1069, fd1068, fd1066;
sub.f64 fd1070, fd1066, fd1068;
add.f64 fd1647, fd1657, fd1648;
mul.f64 fd1071, fd1648, 0d3FE0000000000000;
sub.f64 fd1072, fd1657, fd1071;
sub.f64 fd1073, fd1010, fd1026;
mul.f64 fd1074, fd1073, 0d3FEBB67AE8584CAA;
sub.f64 fd1075, fd1072, fd1074;
add.f64 fd1076, fd1074, fd1072;
add.f64 fd1077, fd1043, fd1048;
add.f64 fd1078, fd1001, fd1077;
mul.f64 fd1081, fd1077, 0d3FE0000000000000;
sub.f64 fd1082, fd1001, fd1081;
add.f64 fd1646, fd1045, fd1050;
sub.f64 fd1083, fd1045, fd1050;
mul.f64 fd1084, fd1083, 0d3FEBB67AE8584CAA;
add.f64 fd1085, fd1084, fd1082;
sub.f64 fd1086, fd1082, fd1084;
add.f64 fd1645, fd1007, fd1646;
mul.f64 fd1087, fd1646, 0d3FE0000000000000;
sub.f64 fd1088, fd1007, fd1087;
sub.f64 fd1089, fd1043, fd1048;
mul.f64 fd1090, fd1089, 0d3FEBB67AE8584CAA;
sub.f64 fd1091, fd1088, fd1090;
add.f64 fd1092, fd1090, fd1088;
add.f64 fd1093, fd1053, fd1058;
add.f64 fd1094, fd1002, fd1093;
mul.f64 fd1097, fd1093, 0d3FE0000000000000;
sub.f64 fd1098, fd1002, fd1097;
add.f64 fd1644, fd1055, fd1060;
sub.f64 fd1099, fd1055, fd1060;
mul.f64 fd1100, fd1099, 0d3FEBB67AE8584CAA;
add.f64 fd1101, fd1100, fd1098;
sub.f64 fd1102, fd1098, fd1100;
add.f64 fd1643, fd1008, fd1644;
mul.f64 fd1103, fd1644, 0d3FE0000000000000;
sub.f64 fd1104, fd1008, fd1103;
sub.f64 fd1105, fd1053, fd1058;
mul.f64 fd1106, fd1105, 0d3FEBB67AE8584CAA;
sub.f64 fd1107, fd1104, fd1106;
add.f64 fd1108, fd1106, fd1104;
add.f64 fd1109, fd949, fd958;
add.f64 fd1110, fd940, fd1109;
mul.f64 fd1113, fd1109, 0d3FE0000000000000;
sub.f64 fd1114, fd940, fd1113;
add.f64 fd1642, fd976, fd985;
sub.f64 fd1115, fd976, fd985;
mul.f64 fd1116, fd1115, 0d3FEBB67AE8584CAA;
add.f64 fd1117, fd1116, fd1114;
sub.f64 fd1118, fd1114, fd1116;
add.f64 fd1641, fd967, fd1642;
mul.f64 fd1119, fd1642, 0d3FE0000000000000;
sub.f64 fd1120, fd967, fd1119;
sub.f64 fd1121, fd949, fd958;
mul.f64 fd1122, fd1121, 0d3FEBB67AE8584CAA;
sub.f64 fd1123, fd1120, fd1122;
add.f64 fd1124, fd1122, fd1120;
add.f64 fd1125, fd952, fd961;
add.f64 fd1126, fd943, fd1125;
mul.f64 fd1129, fd1125, 0d3FE0000000000000;
sub.f64 fd1130, fd943, fd1129;
add.f64 fd1640, fd979, fd988;
sub.f64 fd1131, fd979, fd988;
mul.f64 fd1132, fd1131, 0d3FEBB67AE8584CAA;
add.f64 fd1133, fd1132, fd1130;
sub.f64 fd1134, fd1130, fd1132;
add.f64 fd1639, fd970, fd1640;
mul.f64 fd1135, fd1640, 0d3FE0000000000000;
sub.f64 fd1136, fd970, fd1135;
sub.f64 fd1137, fd952, fd961;
mul.f64 fd1138, fd1137, 0d3FEBB67AE8584CAA;
sub.f64 fd1139, fd1136, fd1138;
add.f64 fd1140, fd1138, fd1136;
add.f64 fd1141, fd955, fd964;
add.f64 fd1142, fd946, fd1141;
mul.f64 fd1145, fd1141, 0d3FE0000000000000;
sub.f64 fd1146, fd946, fd1145;
add.f64 fd1638, fd982, fd991;
sub.f64 fd1147, fd982, fd991;
mul.f64 fd1148, fd1147, 0d3FEBB67AE8584CAA;
add.f64 fd1149, fd1148, fd1146;
sub.f64 fd1150, fd1146, fd1148;
add.f64 fd1637, fd973, fd1638;
mul.f64 fd1151, fd1638, 0d3FE0000000000000;
sub.f64 fd1152, fd973, fd1151;
sub.f64 fd1153, fd955, fd964;
mul.f64 fd1154, fd1153, 0d3FEBB67AE8584CAA;
sub.f64 fd1155, fd1152, fd1154;
add.f64 fd1156, fd1154, fd1152;
mul.f64 fd1158, fd1139, 0dBFE491B7523C161D;
mul.f64 fd1636, fd1133, 0d3FE8836FA2CF5039;
sub.f64 fd1159, fd1636, fd1158;
mul.f64 fd1160, fd1139, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1161, fd1133, 0dBFE491B7523C161D, fd1160;
mul.f64 fd1163, fd1155, 0dBFEF838B8C811C17;
mul.f64 fd1635, fd1149, 0d3FC63A1A7E0B738A;
sub.f64 fd1164, fd1635, fd1163;
mul.f64 fd1165, fd1155, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1166, fd1149, 0dBFEF838B8C811C17, fd1165;
mul.f64 fd1168, fd1140, 0dBFEF838B8C811C17;
mul.f64 fd1634, fd1134, 0d3FC63A1A7E0B738A;
sub.f64 fd1169, fd1634, fd1168;
mul.f64 fd1170, fd1140, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1171, fd1134, 0dBFEF838B8C811C17, fd1170;
mul.f64 fd1173, fd1156, 0dBFD5E3A8748A0BF5;
mul.f64 fd1633, fd1150, 0dBFEE11F642522D1C;
sub.f64 fd1174, fd1633, fd1173;
mul.f64 fd1175, fd1156, 0dBFEE11F642522D1C;
fma.rn.f64 fd1176, fd1150, 0dBFD5E3A8748A0BF5, fd1175;
add.f64 fd1177, fd1126, fd1142;
add.f64 fd1178, fd1110, fd1177;
mul.f64 fd1181, fd1177, 0d3FE0000000000000;
sub.f64 fd1182, fd1110, fd1181;
add.f64 fd1632, fd1639, fd1637;
sub.f64 fd1183, fd1639, fd1637;
mul.f64 fd1184, fd1183, 0d3FEBB67AE8584CAA;
add.f64 fd1185, fd1184, fd1182;
sub.f64 fd1186, fd1182, fd1184;
add.f64 fd1631, fd1641, fd1632;
mul.f64 fd1187, fd1632, 0d3FE0000000000000;
sub.f64 fd1188, fd1641, fd1187;
sub.f64 fd1189, fd1126, fd1142;
mul.f64 fd1190, fd1189, 0d3FEBB67AE8584CAA;
sub.f64 fd1191, fd1188, fd1190;
add.f64 fd1192, fd1190, fd1188;
add.f64 fd1193, fd1159, fd1164;
add.f64 fd1194, fd1117, fd1193;
mul.f64 fd1197, fd1193, 0d3FE0000000000000;
sub.f64 fd1198, fd1117, fd1197;
add.f64 fd1630, fd1161, fd1166;
sub.f64 fd1199, fd1161, fd1166;
mul.f64 fd1200, fd1199, 0d3FEBB67AE8584CAA;
add.f64 fd1201, fd1200, fd1198;
sub.f64 fd1202, fd1198, fd1200;
add.f64 fd1629, fd1123, fd1630;
mul.f64 fd1203, fd1630, 0d3FE0000000000000;
sub.f64 fd1204, fd1123, fd1203;
sub.f64 fd1205, fd1159, fd1164;
mul.f64 fd1206, fd1205, 0d3FEBB67AE8584CAA;
sub.f64 fd1207, fd1204, fd1206;
add.f64 fd1208, fd1206, fd1204;
add.f64 fd1209, fd1169, fd1174;
add.f64 fd1210, fd1118, fd1209;
mul.f64 fd1213, fd1209, 0d3FE0000000000000;
sub.f64 fd1214, fd1118, fd1213;
add.f64 fd1628, fd1171, fd1176;
sub.f64 fd1215, fd1171, fd1176;
mul.f64 fd1216, fd1215, 0d3FEBB67AE8584CAA;
add.f64 fd1217, fd1216, fd1214;
sub.f64 fd1218, fd1214, fd1216;
add.f64 fd1627, fd1124, fd1628;
mul.f64 fd1219, fd1628, 0d3FE0000000000000;
sub.f64 fd1220, fd1124, fd1219;
sub.f64 fd1221, fd1169, fd1174;
mul.f64 fd1222, fd1221, 0d3FEBB67AE8584CAA;
sub.f64 fd1223, fd1220, fd1222;
add.f64 fd1224, fd1222, fd1220;
add.f64 fd1225, fd950, fd959;
add.f64 fd1226, fd941, fd1225;
mul.f64 fd1229, fd1225, 0d3FE0000000000000;
sub.f64 fd1230, fd941, fd1229;
add.f64 fd1626, fd977, fd986;
sub.f64 fd1231, fd977, fd986;
mul.f64 fd1232, fd1231, 0d3FEBB67AE8584CAA;
add.f64 fd1233, fd1232, fd1230;
sub.f64 fd1234, fd1230, fd1232;
add.f64 fd1625, fd968, fd1626;
mul.f64 fd1235, fd1626, 0d3FE0000000000000;
sub.f64 fd1236, fd968, fd1235;
sub.f64 fd1237, fd950, fd959;
mul.f64 fd1238, fd1237, 0d3FEBB67AE8584CAA;
sub.f64 fd1239, fd1236, fd1238;
add.f64 fd1240, fd1238, fd1236;
add.f64 fd1241, fd953, fd962;
add.f64 fd1242, fd944, fd1241;
mul.f64 fd1245, fd1241, 0d3FE0000000000000;
sub.f64 fd1246, fd944, fd1245;
add.f64 fd1624, fd980, fd989;
sub.f64 fd1247, fd980, fd989;
mul.f64 fd1248, fd1247, 0d3FEBB67AE8584CAA;
add.f64 fd1249, fd1248, fd1246;
sub.f64 fd1250, fd1246, fd1248;
add.f64 fd1623, fd971, fd1624;
mul.f64 fd1251, fd1624, 0d3FE0000000000000;
sub.f64 fd1252, fd971, fd1251;
sub.f64 fd1253, fd953, fd962;
mul.f64 fd1254, fd1253, 0d3FEBB67AE8584CAA;
sub.f64 fd1255, fd1252, fd1254;
add.f64 fd1256, fd1254, fd1252;
add.f64 fd1257, fd956, fd965;
add.f64 fd1258, fd947, fd1257;
mul.f64 fd1261, fd1257, 0d3FE0000000000000;
sub.f64 fd1262, fd947, fd1261;
add.f64 fd1622, fd983, fd992;
sub.f64 fd1263, fd983, fd992;
mul.f64 fd1264, fd1263, 0d3FEBB67AE8584CAA;
add.f64 fd1265, fd1264, fd1262;
sub.f64 fd1266, fd1262, fd1264;
add.f64 fd1621, fd974, fd1622;
mul.f64 fd1267, fd1622, 0d3FE0000000000000;
sub.f64 fd1268, fd974, fd1267;
sub.f64 fd1269, fd956, fd965;
mul.f64 fd1270, fd1269, 0d3FEBB67AE8584CAA;
sub.f64 fd1271, fd1268, fd1270;
add.f64 fd1272, fd1270, fd1268;
mul.f64 fd1274, fd1255, 0dBFE491B7523C161D;
mul.f64 fd1620, fd1249, 0d3FE8836FA2CF5039;
sub.f64 fd1275, fd1620, fd1274;
mul.f64 fd1276, fd1255, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1277, fd1249, 0dBFE491B7523C161D, fd1276;
mul.f64 fd1279, fd1271, 0dBFEF838B8C811C17;
mul.f64 fd1619, fd1265, 0d3FC63A1A7E0B738A;
sub.f64 fd1280, fd1619, fd1279;
mul.f64 fd1281, fd1271, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1282, fd1265, 0dBFEF838B8C811C17, fd1281;
mul.f64 fd1284, fd1256, 0dBFEF838B8C811C17;
mul.f64 fd1618, fd1250, 0d3FC63A1A7E0B738A;
sub.f64 fd1285, fd1618, fd1284;
mul.f64 fd1286, fd1256, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1287, fd1250, 0dBFEF838B8C811C17, fd1286;
mul.f64 fd1289, fd1272, 0dBFD5E3A8748A0BF5;
mul.f64 fd1617, fd1266, 0dBFEE11F642522D1C;
sub.f64 fd1290, fd1617, fd1289;
mul.f64 fd1291, fd1272, 0dBFEE11F642522D1C;
fma.rn.f64 fd1292, fd1266, 0dBFD5E3A8748A0BF5, fd1291;
add.f64 fd1293, fd1242, fd1258;
add.f64 fd1294, fd1226, fd1293;
mul.f64 fd1297, fd1293, 0d3FE0000000000000;
sub.f64 fd1298, fd1226, fd1297;
add.f64 fd1616, fd1623, fd1621;
sub.f64 fd1299, fd1623, fd1621;
mul.f64 fd1300, fd1299, 0d3FEBB67AE8584CAA;
add.f64 fd1301, fd1300, fd1298;
sub.f64 fd1302, fd1298, fd1300;
add.f64 fd1615, fd1625, fd1616;
mul.f64 fd1303, fd1616, 0d3FE0000000000000;
sub.f64 fd1304, fd1625, fd1303;
sub.f64 fd1305, fd1242, fd1258;
mul.f64 fd1306, fd1305, 0d3FEBB67AE8584CAA;
sub.f64 fd1307, fd1304, fd1306;
add.f64 fd1308, fd1306, fd1304;
add.f64 fd1309, fd1275, fd1280;
add.f64 fd1310, fd1233, fd1309;
mul.f64 fd1313, fd1309, 0d3FE0000000000000;
sub.f64 fd1314, fd1233, fd1313;
add.f64 fd1614, fd1277, fd1282;
sub.f64 fd1315, fd1277, fd1282;
mul.f64 fd1316, fd1315, 0d3FEBB67AE8584CAA;
add.f64 fd1317, fd1316, fd1314;
sub.f64 fd1318, fd1314, fd1316;
add.f64 fd1613, fd1239, fd1614;
mul.f64 fd1319, fd1614, 0d3FE0000000000000;
sub.f64 fd1320, fd1239, fd1319;
sub.f64 fd1321, fd1275, fd1280;
mul.f64 fd1322, fd1321, 0d3FEBB67AE8584CAA;
sub.f64 fd1323, fd1320, fd1322;
add.f64 fd1324, fd1322, fd1320;
add.f64 fd1325, fd1285, fd1290;
add.f64 fd1326, fd1234, fd1325;
mul.f64 fd1329, fd1325, 0d3FE0000000000000;
sub.f64 fd1330, fd1234, fd1329;
add.f64 fd1612, fd1287, fd1292;
sub.f64 fd1331, fd1287, fd1292;
mul.f64 fd1332, fd1331, 0d3FEBB67AE8584CAA;
add.f64 fd1333, fd1332, fd1330;
sub.f64 fd1334, fd1330, fd1332;
add.f64 fd1611, fd1240, fd1612;
mul.f64 fd1335, fd1612, 0d3FE0000000000000;
sub.f64 fd1336, fd1240, fd1335;
sub.f64 fd1337, fd1285, fd1290;
mul.f64 fd1338, fd1337, 0d3FEBB67AE8584CAA;
sub.f64 fd1339, fd1336, fd1338;
add.f64 fd1340, fd1338, fd1336;
mul.f64 fd1609, fd1194, 0d3FEF232EFF15C9E6;
mul.f64 fd1610, fd1629, 0dBFCD84D223638000;
sub.f64 fd1343, fd1609, fd1610;
mul.f64 fd1344, fd1629, 0d3FEF232EFF15C9E6;
fma.rn.f64 fd1345, fd1194, 0dBFCD84D223638000, fd1344;
mul.f64 fd1607, fd1310, 0d3FEC98A37A9A7850;
mul.f64 fd1608, fd1613, 0dBFDCB920325BAFA6;
sub.f64 fd1348, fd1607, fd1608;
mul.f64 fd1349, fd1613, 0d3FEC98A37A9A7850;
fma.rn.f64 fd1350, fd1310, 0dBFDCB920325BAFA6, fd1349;
mul.f64 fd1605, fd1210, 0d3FEC98A37A9A7850;
mul.f64 fd1606, fd1627, 0dBFDCB920325BAFA6;
sub.f64 fd1353, fd1605, fd1606;
mul.f64 fd1354, fd1627, 0d3FEC98A37A9A7850;
fma.rn.f64 fd1355, fd1210, 0dBFDCB920325BAFA6, fd1354;
mul.f64 fd1357, fd1611, 0dBFE9AAFE4207DF5F;
mul.f64 fd1604, fd1326, 0d3FE31BEC55BC71BC;
sub.f64 fd1358, fd1604, fd1357;
mul.f64 fd1359, fd1611, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd1360, fd1326, 0dBFE9AAFE4207DF5F, fd1359;
mul.f64 fd1362, fd1191, 0dBFE491B7523C161D;
mul.f64 fd1603, fd1185, 0d3FE8836FA2CF5039;
sub.f64 fd1363, fd1603, fd1362;
mul.f64 fd1364, fd1191, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1365, fd1185, 0dBFE491B7523C161D, fd1364;
mul.f64 fd1367, fd1307, 0dBFEF838B8C811C17;
mul.f64 fd1602, fd1301, 0d3FC63A1A7E0B738A;
sub.f64 fd1368, fd1602, fd1367;
mul.f64 fd1369, fd1307, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1370, fd1301, 0dBFEF838B8C811C17, fd1369;
mul.f64 fd1372, fd1207, 0dBFE9AAFE4207DF5F;
mul.f64 fd1601, fd1201, 0d3FE31BEC55BC71BC;
sub.f64 fd1373, fd1601, fd1372;
mul.f64 fd1374, fd1207, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd1375, fd1201, 0dBFE9AAFE4207DF5F, fd1374;
mul.f64 fd1377, fd1323, 0dBFEEA7D99F29CADE;
mul.f64 fd1600, fd1317, 0dBFD25AFBF23865BF;
sub.f64 fd1378, fd1600, fd1377;
mul.f64 fd1379, fd1323, 0dBFD25AFBF23865BF;
fma.rn.f64 fd1380, fd1317, 0dBFEEA7D99F29CADE, fd1379;
mul.f64 fd1598, fd1217, 0d3FD9595EF26FB670;
mul.f64 fd1599, fd1223, 0dBFED6206BEB6C24B;
sub.f64 fd1383, fd1598, fd1599;
mul.f64 fd1384, fd1223, 0d3FD9595EF26FB670;
fma.rn.f64 fd1385, fd1217, 0dBFED6206BEB6C24B, fd1384;
mul.f64 fd1596, fd1333, 0dBFE5F5B105F99707;
mul.f64 fd1597, fd1339, 0dBFE746A51650EADE;
sub.f64 fd1388, fd1596, fd1597;
mul.f64 fd1389, fd1339, 0dBFE5F5B105F99707;
fma.rn.f64 fd1390, fd1333, 0dBFE746A51650EADE, fd1389;
mul.f64 fd1594, fd1186, 0d3FC63A1A7E0B738A;
mul.f64 fd1595, fd1192, 0dBFEF838B8C811C17;
sub.f64 fd1393, fd1594, fd1595;
mul.f64 fd1394, fd1192, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1395, fd1186, 0dBFEF838B8C811C17, fd1394;
mul.f64 fd1592, fd1302, 0dBFEE11F642522D1C;
mul.f64 fd1593, fd1308, 0dBFD5E3A8748A0BF5;
sub.f64 fd1398, fd1592, fd1593;
mul.f64 fd1399, fd1308, 0dBFEE11F642522D1C;
fma.rn.f64 fd1400, fd1302, 0dBFD5E3A8748A0BF5, fd1399;
mul.f64 fd1402, fd1208, 0dBFEFF223F3635CE3;
mul.f64 fd1591, fd1202, 0dBFADC528B5343A86;
sub.f64 fd1403, fd1591, fd1402;
mul.f64 fd1404, fd1208, 0dBFADC528B5343A86;
fma.rn.f64 fd1405, fd1202, 0dBFEFF223F3635CE3, fd1404;
mul.f64 fd1407, fd1324, 0d3FBDB843E577175E;
mul.f64 fd1590, fd1318, 0dBFEFC89BCEF44CF4;
sub.f64 fd1408, fd1590, fd1407;
mul.f64 fd1409, fd1324, 0dBFEFC89BCEF44CF4;
fma.rn.f64 fd1410, fd1318, 0d3FBDB843E577175E, fd1409;
mul.f64 fd1412, fd1224, 0dBFEEA7D99F29CADE;
mul.f64 fd1589, fd1218, 0dBFD25AFBF23865BF;
sub.f64 fd1413, fd1589, fd1412;
mul.f64 fd1414, fd1224, 0dBFD25AFBF23865BF;
fma.rn.f64 fd1415, fd1218, 0dBFEEA7D99F29CADE, fd1414;
mul.f64 fd1417, fd1340, 0d3FE19593DA358510;
mul.f64 fd1588, fd1334, 0dBFEABC50EF4734A7;
sub.f64 fd1418, fd1588, fd1417;
mul.f64 fd1419, fd1340, 0dBFEABC50EF4734A7;
fma.rn.f64 fd1420, fd1334, 0d3FE19593DA358510, fd1419;
add.f64 fd1421, fd1178, fd1294;
mul.f64 fd1423, fd1421, 0d3FE0000000000000;
sub.f64 fd1424, fd1062, fd1423;
add.f64 fd1587, fd1631, fd1615;
sub.f64 fd1425, fd1631, fd1615;
mul.f64 fd1426, fd1425, 0d3FEBB67AE8584CAA;
mul.f64 fd1427, fd1587, 0d3FE0000000000000;
sub.f64 fd1428, fd1647, fd1427;
sub.f64 fd1429, fd1178, fd1294;
mul.f64 fd1430, fd1429, 0d3FEBB67AE8584CAA;
add.f64 fd1431, fd1343, fd1348;
mul.f64 fd1433, fd1431, 0d3FE0000000000000;
sub.f64 fd1434, fd1078, fd1433;
add.f64 fd1586, fd1345, fd1350;
sub.f64 fd1435, fd1345, fd1350;
mul.f64 fd1436, fd1435, 0d3FEBB67AE8584CAA;
mul.f64 fd1437, fd1586, 0d3FE0000000000000;
sub.f64 fd1438, fd1645, fd1437;
sub.f64 fd1439, fd1343, fd1348;
mul.f64 fd1440, fd1439, 0d3FEBB67AE8584CAA;
add.f64 fd1441, fd1353, fd1358;
mul.f64 fd1443, fd1441, 0d3FE0000000000000;
sub.f64 fd1444, fd1094, fd1443;
add.f64 fd1585, fd1355, fd1360;
sub.f64 fd1445, fd1355, fd1360;
mul.f64 fd1446, fd1445, 0d3FEBB67AE8584CAA;
mul.f64 fd1447, fd1585, 0d3FE0000000000000;
sub.f64 fd1448, fd1643, fd1447;
sub.f64 fd1449, fd1353, fd1358;
mul.f64 fd1450, fd1449, 0d3FEBB67AE8584CAA;
add.f64 fd1451, fd1363, fd1368;
mul.f64 fd1453, fd1451, 0d3FE0000000000000;
sub.f64 fd1454, fd1069, fd1453;
add.f64 fd1584, fd1365, fd1370;
sub.f64 fd1455, fd1365, fd1370;
mul.f64 fd1456, fd1455, 0d3FEBB67AE8584CAA;
mul.f64 fd1457, fd1584, 0d3FE0000000000000;
sub.f64 fd1458, fd1075, fd1457;
sub.f64 fd1459, fd1363, fd1368;
mul.f64 fd1460, fd1459, 0d3FEBB67AE8584CAA;
add.f64 fd1461, fd1373, fd1378;
mul.f64 fd1463, fd1461, 0d3FE0000000000000;
sub.f64 fd1464, fd1085, fd1463;
add.f64 fd1583, fd1375, fd1380;
sub.f64 fd1465, fd1375, fd1380;
mul.f64 fd1466, fd1465, 0d3FEBB67AE8584CAA;
mul.f64 fd1467, fd1583, 0d3FE0000000000000;
sub.f64 fd1468, fd1091, fd1467;
sub.f64 fd1469, fd1373, fd1378;
mul.f64 fd1470, fd1469, 0d3FEBB67AE8584CAA;
add.f64 fd1471, fd1383, fd1388;
mul.f64 fd1473, fd1471, 0d3FE0000000000000;
sub.f64 fd1474, fd1101, fd1473;
add.f64 fd1582, fd1385, fd1390;
sub.f64 fd1475, fd1385, fd1390;
mul.f64 fd1476, fd1475, 0d3FEBB67AE8584CAA;
mul.f64 fd1477, fd1582, 0d3FE0000000000000;
sub.f64 fd1478, fd1107, fd1477;
sub.f64 fd1479, fd1383, fd1388;
mul.f64 fd1480, fd1479, 0d3FEBB67AE8584CAA;
add.f64 fd1481, fd1393, fd1398;
mul.f64 fd1483, fd1481, 0d3FE0000000000000;
sub.f64 fd1484, fd1070, fd1483;
add.f64 fd1581, fd1395, fd1400;
sub.f64 fd1485, fd1395, fd1400;
mul.f64 fd1486, fd1485, 0d3FEBB67AE8584CAA;
mul.f64 fd1487, fd1581, 0d3FE0000000000000;
sub.f64 fd1488, fd1076, fd1487;
sub.f64 fd1489, fd1393, fd1398;
mul.f64 fd1490, fd1489, 0d3FEBB67AE8584CAA;
add.f64 fd1491, fd1403, fd1408;
mul.f64 fd1493, fd1491, 0d3FE0000000000000;
sub.f64 fd1494, fd1086, fd1493;
add.f64 fd1580, fd1405, fd1410;
sub.f64 fd1495, fd1405, fd1410;
mul.f64 fd1496, fd1495, 0d3FEBB67AE8584CAA;
mul.f64 fd1497, fd1580, 0d3FE0000000000000;
sub.f64 fd1498, fd1092, fd1497;
sub.f64 fd1499, fd1403, fd1408;
mul.f64 fd1500, fd1499, 0d3FEBB67AE8584CAA;
add.f64 fd1501, fd1413, fd1418;
mul.f64 fd1503, fd1501, 0d3FE0000000000000;
sub.f64 fd1504, fd1102, fd1503;
add.f64 fd1579, fd1415, fd1420;
sub.f64 fd1505, fd1415, fd1420;
mul.f64 fd1506, fd1505, 0d3FEBB67AE8584CAA;
mul.f64 fd1507, fd1579, 0d3FE0000000000000;
sub.f64 fd1508, fd1108, fd1507;
sub.f64 fd1509, fd1413, fd1418;
mul.f64 fd1843, fd1431, 0d3FE0000000000000;
sub.f64 fd1842, fd1078, fd1843;
mul.f64 fd1510, fd1509, 0d3FEBB67AE8584CAA;
add.f64 %0, fd1062, fd1421;
mul.f64 fd1845, fd1585, 0d3FE0000000000000;
sub.f64 fd1844, fd1643, fd1845;
add.f64 %1, fd1647, fd1587;
mul.f64 fd1847, fd1586, 0d3FE0000000000000;
sub.f64 fd1846, fd1645, fd1847;
mul.f64 fd1849, fd1501, 0d3FE0000000000000;
sub.f64 fd1848, fd1102, fd1849;
add.f64 %3, fd1645, fd1586;
add.f64 %2, fd1078, fd1431;
add.f64 %5, fd1643, fd1585;
add.f64 %4, fd1094, fd1441;
add.f64 %7, fd1075, fd1584;
add.f64 %6, fd1069, fd1451;
add.f64 %9, fd1091, fd1583;
add.f64 %8, fd1085, fd1461;
add.f64 %11, fd1107, fd1582;
add.f64 %10, fd1101, fd1471;
add.f64 %13, fd1076, fd1581;
add.f64 %12, fd1070, fd1481;
add.f64 %15, fd1092, fd1580;
add.f64 %14, fd1086, fd1491;
add.f64 %17, fd1108, fd1579;
add.f64 %16, fd1102, fd1501;
sub.f64 %19, fd1428, fd1430;
add.f64 %18, fd1426, fd1424;
sub.f64 %21, fd1846, fd1440;
add.f64 %20, fd1436, fd1842;
sub.f64 %23, fd1844, fd1450;
add.f64 %22, fd1446, fd1444;
sub.f64 %25, fd1458, fd1460;
add.f64 %24, fd1456, fd1454;
add.f64 %26, fd1466, fd1464;
sub.f64 %27, fd1468, fd1470;
add.f64 %28, fd1476, fd1474;
sub.f64 %29, fd1478, fd1480;
add.f64 %30, fd1486, fd1484;
sub.f64 %31, fd1488, fd1490;
sub.f64 %33, fd1498, fd1500;
add.f64 %32, fd1496, fd1494;
sub.f64 %35, fd1508, fd1510;
add.f64 %34, fd1506, fd1848;
sub.f64 %36, fd1424, fd1426;
add.f64 %37, fd1430, fd1428;
add.f64 %39, fd1440, fd1846;
sub.f64 %38, fd1842, fd1436;
add.f64 %41, fd1450, fd1844;
sub.f64 %40, fd1444, fd1446;
add.f64 %43, fd1460, fd1458;
sub.f64 %42, fd1454, fd1456;
add.f64 %45, fd1470, fd1468;
sub.f64 %44, fd1464, fd1466;
add.f64 %47, fd1480, fd1478;
sub.f64 %46, fd1474, fd1476;
add.f64 %49, fd1490, fd1488;
sub.f64 %48, fd1484, fd1486;
add.f64 %51, fd1500, fd1498;
sub.f64 %50, fd1494, fd1496;
add.f64 %53, fd1510, fd1508;
sub.f64 %52, fd1848, fd1506;
})"
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y), "=d"(rmem[5].x), "=d"(rmem[5].y), "=d"(rmem[6].x), "=d"(rmem[6].y), "=d"(rmem[7].x), "=d"(rmem[7].y), "=d"(rmem[8].x), "=d"(rmem[8].y), "=d"(rmem[9].x), "=d"(rmem[9].y), "=d"(rmem[10].x), "=d"(rmem[10].y), "=d"(rmem[11].x), "=d"(rmem[11].y), "=d"(rmem[12].x), "=d"(rmem[12].y), "=d"(rmem[13].x), "=d"(rmem[13].y), "=d"(rmem[14].x), "=d"(rmem[14].y), "=d"(rmem[15].x), "=d"(rmem[15].y), "=d"(rmem[16].x), "=d"(rmem[16].y), "=d"(rmem[17].x), "=d"(rmem[17].y), "=d"(rmem[18].x), "=d"(rmem[18].y), "=d"(rmem[19].x), "=d"(rmem[19].y), "=d"(rmem[20].x), "=d"(rmem[20].y), "=d"(rmem[21].x), "=d"(rmem[21].y), "=d"(rmem[22].x), "=d"(rmem[22].y), "=d"(rmem[23].x), "=d"(rmem[23].y), "=d"(rmem[24].x), "=d"(rmem[24].y), "=d"(rmem[25].x), "=d"(rmem[25].y), "=d"(rmem[26].x), "=d"(rmem[26].y): "r"(smem), "l"(lut_dp_27_729), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y), "d"(rmem[5].x), "d"(rmem[5].y), "d"(rmem[6].x), "d"(rmem[6].y), "d"(rmem[7].x), "d"(rmem[7].y), "d"(rmem[8].x), "d"(rmem[8].y), "d"(rmem[9].x), "d"(rmem[9].y), "d"(rmem[10].x), "d"(rmem[10].y), "d"(rmem[11].x), "d"(rmem[11].y), "d"(rmem[12].x), "d"(rmem[12].y), "d"(rmem[13].x), "d"(rmem[13].y), "d"(rmem[14].x), "d"(rmem[14].y), "d"(rmem[15].x), "d"(rmem[15].y), "d"(rmem[16].x), "d"(rmem[16].y), "d"(rmem[17].x), "d"(rmem[17].y), "d"(rmem[18].x), "d"(rmem[18].y), "d"(rmem[19].x), "d"(rmem[19].y), "d"(rmem[20].x), "d"(rmem[20].y), "d"(rmem[21].x), "d"(rmem[21].y), "d"(rmem[22].x), "d"(rmem[22].y), "d"(rmem[23].x), "d"(rmem[23].y), "d"(rmem[24].x), "d"(rmem[24].y), "d"(rmem[25].x), "d"(rmem[25].y), "d"(rmem[26].x), "d"(rmem[26].y), "d"(rmem[10].y), "d"(rmem[19].y), "d"(rmem[1].y), "d"(rmem[22].y), "d"(rmem[13].y), "d"(rmem[4].y), 
"d"(rmem[16].y), "d"(rmem[25].y), "d"(rmem[7].y), "d"(rmem[11].y), "d"(rmem[20].y), "d"(rmem[2].y), "d"(rmem[23].y), "d"(rmem[14].y), "d"(rmem[5].y), "d"(rmem[17].y), "d"(rmem[8].y));
};




template<> __forceinline__ __device__ void cufftdx_private_function<524, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

asm volatile (R"({
.reg .b32 r<18>;
.reg .f64 fd<1887>;
.reg .b64 rd<10>;
mov.u32 r16, %tid.y;
mov.u32 r17, %54;
mad.lo.s32 r3, r16, 11664, r17;
add.f64 fd109, %74, %92;
add.f64 fd110, %56, fd109;
mul.f64 fd113, fd109, 0d3FE0000000000000;
sub.f64 fd114, %56, fd113;
add.f64 fd1886, %75, %93;
sub.f64 fd115, %75, %93;
mul.f64 fd116, fd115, 0d3FEBB67AE8584CAA;
add.f64 fd117, fd116, fd114;
sub.f64 fd118, fd114, fd116;
add.f64 fd1885, %57, fd1886;
mul.f64 fd119, fd1886, 0d3FE0000000000000;
sub.f64 fd120, %57, fd119;
sub.f64 fd121, %74, %92;
mul.f64 fd122, fd121, 0d3FEBB67AE8584CAA;
sub.f64 fd123, fd120, fd122;
add.f64 fd124, fd122, fd120;
add.f64 fd125, %80, %98;
add.f64 fd126, %62, fd125;
mul.f64 fd129, fd125, 0d3FE0000000000000;
sub.f64 fd130, %62, fd129;
add.f64 fd1884, %81, %99;
sub.f64 fd131, %81, %99;
mul.f64 fd132, fd131, 0d3FEBB67AE8584CAA;
add.f64 fd133, fd132, fd130;
sub.f64 fd134, fd130, fd132;
add.f64 fd1883, %63, fd1884;
mul.f64 fd135, fd1884, 0d3FE0000000000000;
sub.f64 fd136, %63, fd135;
sub.f64 fd137, %80, %98;
mul.f64 fd138, fd137, 0d3FEBB67AE8584CAA;
sub.f64 fd139, fd136, fd138;
add.f64 fd140, fd138, fd136;
add.f64 fd141, %86, %104;
add.f64 fd142, %68, fd141;
mul.f64 fd145, fd141, 0d3FE0000000000000;
sub.f64 fd146, %68, fd145;
add.f64 fd1882, %87, %105;
sub.f64 fd147, %87, %105;
mul.f64 fd148, fd147, 0d3FEBB67AE8584CAA;
add.f64 fd149, fd148, fd146;
sub.f64 fd150, fd146, fd148;
add.f64 fd1881, %69, fd1882;
mul.f64 fd151, fd1882, 0d3FE0000000000000;
sub.f64 fd152, %69, fd151;
sub.f64 fd153, %86, %104;
mul.f64 fd154, fd153, 0d3FEBB67AE8584CAA;
sub.f64 fd155, fd152, fd154;
add.f64 fd156, fd154, fd152;
mul.f64 fd158, fd139, 0dBFE491B7523C161D;
mul.f64 fd1880, fd133, 0d3FE8836FA2CF5039;
sub.f64 fd159, fd1880, fd158;
mul.f64 fd160, fd139, 0d3FE8836FA2CF5039;
fma.rn.f64 fd161, fd133, 0dBFE491B7523C161D, fd160;
mul.f64 fd1878, fd149, 0d3FC63A1A7E0B738A;
mul.f64 fd1879, fd155, 0dBFEF838B8C811C17;
sub.f64 fd164, fd1878, fd1879;
mul.f64 fd165, fd155, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd166, fd149, 0dBFEF838B8C811C17, fd165;
mul.f64 fd1876, fd134, 0d3FC63A1A7E0B738A;
mul.f64 fd1877, fd140, 0dBFEF838B8C811C17;
sub.f64 fd169, fd1876, fd1877;
mul.f64 fd170, fd140, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd171, fd134, 0dBFEF838B8C811C17, fd170;
mul.f64 fd1874, fd150, 0dBFEE11F642522D1C;
mul.f64 fd1875, fd156, 0dBFD5E3A8748A0BF5;
sub.f64 fd174, fd1874, fd1875;
mul.f64 fd175, fd156, 0dBFEE11F642522D1C;
fma.rn.f64 fd176, fd150, 0dBFD5E3A8748A0BF5, fd175;
add.f64 fd177, fd126, fd142;
add.f64 fd178, fd110, fd177;
mul.f64 fd181, fd177, 0d3FE0000000000000;
sub.f64 fd182, fd110, fd181;
add.f64 fd1873, fd1883, fd1881;
sub.f64 fd183, fd1883, fd1881;
mul.f64 fd184, fd183, 0d3FEBB67AE8584CAA;
add.f64 fd185, fd184, fd182;
sub.f64 fd186, fd182, fd184;
add.f64 fd1872, fd1885, fd1873;
mul.f64 fd187, fd1873, 0d3FE0000000000000;
sub.f64 fd188, fd1885, fd187;
sub.f64 fd189, fd126, fd142;
mul.f64 fd190, fd189, 0d3FEBB67AE8584CAA;
sub.f64 fd191, fd188, fd190;
add.f64 fd192, fd190, fd188;
add.f64 fd193, fd159, fd164;
add.f64 fd194, fd117, fd193;
mul.f64 fd197, fd193, 0d3FE0000000000000;
sub.f64 fd198, fd117, fd197;
add.f64 fd1871, fd161, fd166;
sub.f64 fd199, fd161, fd166;
mul.f64 fd200, fd199, 0d3FEBB67AE8584CAA;
add.f64 fd201, fd200, fd198;
sub.f64 fd202, fd198, fd200;
add.f64 fd1870, fd123, fd1871;
mul.f64 fd203, fd1871, 0d3FE0000000000000;
sub.f64 fd204, fd123, fd203;
sub.f64 fd205, fd159, fd164;
mul.f64 fd206, fd205, 0d3FEBB67AE8584CAA;
sub.f64 fd207, fd204, fd206;
add.f64 fd208, fd206, fd204;
add.f64 fd209, fd169, fd174;
add.f64 fd210, fd118, fd209;
mul.f64 fd213, fd209, 0d3FE0000000000000;
sub.f64 fd214, fd118, fd213;
add.f64 fd1869, fd171, fd176;
sub.f64 fd215, fd171, fd176;
mul.f64 fd216, fd215, 0d3FEBB67AE8584CAA;
add.f64 fd217, fd216, fd214;
sub.f64 fd218, fd214, fd216;
add.f64 fd1868, fd124, fd1869;
mul.f64 fd219, fd1869, 0d3FE0000000000000;
sub.f64 fd220, fd124, fd219;
sub.f64 fd221, fd169, fd174;
mul.f64 fd222, fd221, 0d3FEBB67AE8584CAA;
sub.f64 fd223, fd220, fd222;
add.f64 fd224, fd222, fd220;
add.f64 fd225, %76, %94;
add.f64 fd226, %58, fd225;
mul.f64 fd229, fd225, 0d3FE0000000000000;
sub.f64 fd230, %58, fd229;
add.f64 fd1865, %110, %111;
sub.f64 fd231, %110, %111;
mul.f64 fd232, fd231, 0d3FEBB67AE8584CAA;
add.f64 fd233, fd232, fd230;
sub.f64 fd234, fd230, fd232;
add.f64 fd1863, %112, fd1865;
mul.f64 fd235, fd1865, 0d3FE0000000000000;
sub.f64 fd236, %112, fd235;
sub.f64 fd237, %76, %94;
mul.f64 fd238, fd237, 0d3FEBB67AE8584CAA;
sub.f64 fd239, fd236, fd238;
add.f64 fd240, fd238, fd236;
add.f64 fd241, %82, %100;
add.f64 fd242, %64, fd241;
mul.f64 fd245, fd241, 0d3FE0000000000000;
sub.f64 fd246, %64, fd245;
add.f64 fd1860, %114, %113;
sub.f64 fd247, %114, %113;
mul.f64 fd248, fd247, 0d3FEBB67AE8584CAA;
add.f64 fd249, fd248, fd246;
sub.f64 fd250, fd246, fd248;
add.f64 fd1858, %115, fd1860;
mul.f64 fd251, fd1860, 0d3FE0000000000000;
sub.f64 fd252, %115, fd251;
sub.f64 fd253, %82, %100;
mul.f64 fd254, fd253, 0d3FEBB67AE8584CAA;
sub.f64 fd255, fd252, fd254;
add.f64 fd256, fd254, fd252;
add.f64 fd257, %88, %106;
add.f64 fd258, %70, fd257;
mul.f64 fd261, fd257, 0d3FE0000000000000;
sub.f64 fd262, %70, fd261;
add.f64 fd1855, %116, %117;
sub.f64 fd263, %116, %117;
mul.f64 fd264, fd263, 0d3FEBB67AE8584CAA;
add.f64 fd265, fd264, fd262;
sub.f64 fd266, fd262, fd264;
add.f64 fd1853, %118, fd1855;
mul.f64 fd267, fd1855, 0d3FE0000000000000;
sub.f64 fd268, %118, fd267;
sub.f64 fd269, %88, %106;
mul.f64 fd270, fd269, 0d3FEBB67AE8584CAA;
sub.f64 fd271, fd268, fd270;
add.f64 fd272, fd270, fd268;
mul.f64 fd274, fd255, 0dBFE491B7523C161D;
mul.f64 fd1852, fd249, 0d3FE8836FA2CF5039;
sub.f64 fd275, fd1852, fd274;
mul.f64 fd276, fd255, 0d3FE8836FA2CF5039;
fma.rn.f64 fd277, fd249, 0dBFE491B7523C161D, fd276;
mul.f64 fd279, fd271, 0dBFEF838B8C811C17;
mul.f64 fd1851, fd265, 0d3FC63A1A7E0B738A;
sub.f64 fd280, fd1851, fd279;
mul.f64 fd281, fd271, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd282, fd265, 0dBFEF838B8C811C17, fd281;
mul.f64 fd1849, fd250, 0d3FC63A1A7E0B738A;
mul.f64 fd1850, fd256, 0dBFEF838B8C811C17;
sub.f64 fd285, fd1849, fd1850;
mul.f64 fd286, fd256, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd287, fd250, 0dBFEF838B8C811C17, fd286;
mul.f64 fd1847, fd266, 0dBFEE11F642522D1C;
mul.f64 fd1848, fd272, 0dBFD5E3A8748A0BF5;
sub.f64 fd290, fd1847, fd1848;
mul.f64 fd291, fd272, 0dBFEE11F642522D1C;
fma.rn.f64 fd292, fd266, 0dBFD5E3A8748A0BF5, fd291;
add.f64 fd293, fd242, fd258;
add.f64 fd294, fd226, fd293;
mul.f64 fd297, fd293, 0d3FE0000000000000;
sub.f64 fd298, fd226, fd297;
add.f64 fd1846, fd1858, fd1853;
sub.f64 fd299, fd1858, fd1853;
mul.f64 fd300, fd299, 0d3FEBB67AE8584CAA;
add.f64 fd301, fd300, fd298;
sub.f64 fd302, fd298, fd300;
add.f64 fd1845, fd1863, fd1846;
mul.f64 fd303, fd1846, 0d3FE0000000000000;
sub.f64 fd304, fd1863, fd303;
sub.f64 fd305, fd242, fd258;
mul.f64 fd306, fd305, 0d3FEBB67AE8584CAA;
sub.f64 fd307, fd304, fd306;
add.f64 fd308, fd306, fd304;
add.f64 fd309, fd275, fd280;
add.f64 fd310, fd233, fd309;
mul.f64 fd313, fd309, 0d3FE0000000000000;
sub.f64 fd314, fd233, fd313;
add.f64 fd1844, fd277, fd282;
sub.f64 fd315, fd277, fd282;
mul.f64 fd316, fd315, 0d3FEBB67AE8584CAA;
add.f64 fd317, fd316, fd314;
sub.f64 fd318, fd314, fd316;
add.f64 fd1843, fd239, fd1844;
mul.f64 fd319, fd1844, 0d3FE0000000000000;
sub.f64 fd320, fd239, fd319;
sub.f64 fd321, fd275, fd280;
mul.f64 fd322, fd321, 0d3FEBB67AE8584CAA;
sub.f64 fd323, fd320, fd322;
add.f64 fd324, fd322, fd320;
add.f64 fd325, fd285, fd290;
add.f64 fd326, fd234, fd325;
mul.f64 fd329, fd325, 0d3FE0000000000000;
sub.f64 fd330, fd234, fd329;
add.f64 fd1842, fd287, fd292;
sub.f64 fd331, fd287, fd292;
mul.f64 fd332, fd331, 0d3FEBB67AE8584CAA;
add.f64 fd333, fd332, fd330;
sub.f64 fd334, fd330, fd332;
add.f64 fd1841, fd240, fd1842;
mul.f64 fd335, fd1842, 0d3FE0000000000000;
sub.f64 fd336, fd240, fd335;
sub.f64 fd337, fd285, fd290;
mul.f64 fd338, fd337, 0d3FEBB67AE8584CAA;
sub.f64 fd339, fd336, fd338;
add.f64 fd340, fd338, fd336;
add.f64 fd341, %78, %96;
add.f64 fd342, %60, fd341;
mul.f64 fd345, fd341, 0d3FE0000000000000;
sub.f64 fd346, %60, fd345;
add.f64 fd1838, %119, %120;
sub.f64 fd347, %119, %120;
mul.f64 fd348, fd347, 0d3FEBB67AE8584CAA;
add.f64 fd349, fd348, fd346;
sub.f64 fd350, fd346, fd348;
add.f64 fd1836, %121, fd1838;
mul.f64 fd351, fd1838, 0d3FE0000000000000;
sub.f64 fd352, %121, fd351;
sub.f64 fd353, %78, %96;
mul.f64 fd354, fd353, 0d3FEBB67AE8584CAA;
sub.f64 fd355, fd352, fd354;
add.f64 fd356, fd354, fd352;
add.f64 fd357, %84, %102;
add.f64 fd358, %66, fd357;
mul.f64 fd361, fd357, 0d3FE0000000000000;
sub.f64 fd362, %66, fd361;
add.f64 fd1833, %123, %122;
sub.f64 fd363, %123, %122;
mul.f64 fd364, fd363, 0d3FEBB67AE8584CAA;
add.f64 fd365, fd364, fd362;
sub.f64 fd366, fd362, fd364;
add.f64 fd1831, %124, fd1833;
mul.f64 fd367, fd1833, 0d3FE0000000000000;
sub.f64 fd368, %124, fd367;
sub.f64 fd369, %84, %102;
mul.f64 fd370, fd369, 0d3FEBB67AE8584CAA;
sub.f64 fd371, fd368, fd370;
add.f64 fd372, fd370, fd368;
add.f64 fd373, %90, %108;
add.f64 fd374, %72, fd373;
mul.f64 fd377, fd373, 0d3FE0000000000000;
sub.f64 fd378, %72, fd377;
add.f64 fd1829, %125, %109;
sub.f64 fd379, %125, %109;
mul.f64 fd380, fd379, 0d3FEBB67AE8584CAA;
add.f64 fd381, fd380, fd378;
sub.f64 fd382, fd378, fd380;
add.f64 fd1827, %126, fd1829;
mul.f64 fd383, fd1829, 0d3FE0000000000000;
sub.f64 fd384, %126, fd383;
sub.f64 fd385, %90, %108;
mul.f64 fd386, fd385, 0d3FEBB67AE8584CAA;
sub.f64 fd387, fd384, fd386;
add.f64 fd388, fd386, fd384;
mul.f64 fd390, fd371, 0dBFE491B7523C161D;
mul.f64 fd1826, fd365, 0d3FE8836FA2CF5039;
sub.f64 fd391, fd1826, fd390;
mul.f64 fd392, fd371, 0d3FE8836FA2CF5039;
fma.rn.f64 fd393, fd365, 0dBFE491B7523C161D, fd392;
mul.f64 fd395, fd387, 0dBFEF838B8C811C17;
mul.f64 fd1825, fd381, 0d3FC63A1A7E0B738A;
sub.f64 fd396, fd1825, fd395;
mul.f64 fd397, fd387, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd398, fd381, 0dBFEF838B8C811C17, fd397;
mul.f64 fd1823, fd366, 0d3FC63A1A7E0B738A;
mul.f64 fd1824, fd372, 0dBFEF838B8C811C17;
sub.f64 fd401, fd1823, fd1824;
mul.f64 fd402, fd372, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd403, fd366, 0dBFEF838B8C811C17, fd402;
mul.f64 fd1821, fd382, 0dBFEE11F642522D1C;
mul.f64 fd1822, fd388, 0dBFD5E3A8748A0BF5;
sub.f64 fd406, fd1821, fd1822;
mul.f64 fd407, fd388, 0dBFEE11F642522D1C;
fma.rn.f64 fd408, fd382, 0dBFD5E3A8748A0BF5, fd407;
add.f64 fd409, fd358, fd374;
add.f64 fd410, fd342, fd409;
mul.f64 fd413, fd409, 0d3FE0000000000000;
sub.f64 fd414, fd342, fd413;
add.f64 fd1820, fd1831, fd1827;
sub.f64 fd415, fd1831, fd1827;
mul.f64 fd416, fd415, 0d3FEBB67AE8584CAA;
add.f64 fd417, fd416, fd414;
sub.f64 fd418, fd414, fd416;
add.f64 fd1819, fd1836, fd1820;
mul.f64 fd419, fd1820, 0d3FE0000000000000;
sub.f64 fd420, fd1836, fd419;
sub.f64 fd421, fd358, fd374;
mul.f64 fd422, fd421, 0d3FEBB67AE8584CAA;
sub.f64 fd423, fd420, fd422;
add.f64 fd424, fd422, fd420;
add.f64 fd425, fd391, fd396;
add.f64 fd426, fd349, fd425;
mul.f64 fd429, fd425, 0d3FE0000000000000;
sub.f64 fd430, fd349, fd429;
add.f64 fd1818, fd393, fd398;
sub.f64 fd431, fd393, fd398;
mul.f64 fd432, fd431, 0d3FEBB67AE8584CAA;
add.f64 fd433, fd432, fd430;
sub.f64 fd434, fd430, fd432;
add.f64 fd1817, fd355, fd1818;
mul.f64 fd435, fd1818, 0d3FE0000000000000;
sub.f64 fd436, fd355, fd435;
sub.f64 fd437, fd391, fd396;
mul.f64 fd438, fd437, 0d3FEBB67AE8584CAA;
sub.f64 fd439, fd436, fd438;
add.f64 fd440, fd438, fd436;
add.f64 fd441, fd401, fd406;
add.f64 fd442, fd350, fd441;
mul.f64 fd445, fd441, 0d3FE0000000000000;
sub.f64 fd446, fd350, fd445;
add.f64 fd1816, fd403, fd408;
sub.f64 fd447, fd403, fd408;
mul.f64 fd448, fd447, 0d3FEBB67AE8584CAA;
add.f64 fd449, fd448, fd446;
sub.f64 fd450, fd446, fd448;
add.f64 fd1815, fd356, fd1816;
mul.f64 fd451, fd1816, 0d3FE0000000000000;
sub.f64 fd452, fd356, fd451;
sub.f64 fd453, fd401, fd406;
mul.f64 fd454, fd453, 0d3FEBB67AE8584CAA;
sub.f64 fd455, fd452, fd454;
add.f64 fd456, fd454, fd452;
mul.f64 fd458, fd1843, 0dBFCD84D223638000;
mul.f64 fd1814, fd310, 0d3FEF232EFF15C9E6;
sub.f64 fd459, fd1814, fd458;
mul.f64 fd460, fd1843, 0d3FEF232EFF15C9E6;
fma.rn.f64 fd461, fd310, 0dBFCD84D223638000, fd460;
mul.f64 fd1812, fd426, 0d3FEC98A37A9A7850;
mul.f64 fd1813, fd1817, 0dBFDCB920325BAFA6;
sub.f64 fd464, fd1812, fd1813;
mul.f64 fd465, fd1817, 0d3FEC98A37A9A7850;
fma.rn.f64 fd466, fd426, 0dBFDCB920325BAFA6, fd465;
mul.f64 fd1810, fd326, 0d3FEC98A37A9A7850;
mul.f64 fd1811, fd1841, 0dBFDCB920325BAFA6;
sub.f64 fd469, fd1810, fd1811;
mul.f64 fd470, fd1841, 0d3FEC98A37A9A7850;
fma.rn.f64 fd471, fd326, 0dBFDCB920325BAFA6, fd470;
mul.f64 fd1808, fd442, 0d3FE31BEC55BC71BC;
mul.f64 fd1809, fd1815, 0dBFE9AAFE4207DF5F;
sub.f64 fd474, fd1808, fd1809;
mul.f64 fd475, fd1815, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd476, fd442, 0dBFE9AAFE4207DF5F, fd475;
mul.f64 fd1806, fd301, 0d3FE8836FA2CF5039;
mul.f64 fd1807, fd307, 0dBFE491B7523C161D;
sub.f64 fd479, fd1806, fd1807;
mul.f64 fd480, fd307, 0d3FE8836FA2CF5039;
fma.rn.f64 fd481, fd301, 0dBFE491B7523C161D, fd480;
mul.f64 fd483, fd423, 0dBFEF838B8C811C17;
mul.f64 fd1805, fd417, 0d3FC63A1A7E0B738A;
sub.f64 fd484, fd1805, fd483;
mul.f64 fd485, fd423, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd486, fd417, 0dBFEF838B8C811C17, fd485;
mul.f64 fd488, fd323, 0dBFE9AAFE4207DF5F;
mul.f64 fd1804, fd317, 0d3FE31BEC55BC71BC;
sub.f64 fd489, fd1804, fd488;
mul.f64 fd490, fd323, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd491, fd317, 0dBFE9AAFE4207DF5F, fd490;
mul.f64 fd493, fd439, 0dBFEEA7D99F29CADE;
mul.f64 fd1803, fd433, 0dBFD25AFBF23865BF;
sub.f64 fd494, fd1803, fd493;
mul.f64 fd495, fd439, 0dBFD25AFBF23865BF;
fma.rn.f64 fd496, fd433, 0dBFEEA7D99F29CADE, fd495;
mul.f64 fd498, fd339, 0dBFED6206BEB6C24B;
mul.f64 fd1802, fd333, 0d3FD9595EF26FB670;
sub.f64 fd499, fd1802, fd498;
mul.f64 fd500, fd339, 0d3FD9595EF26FB670;
fma.rn.f64 fd501, fd333, 0dBFED6206BEB6C24B, fd500;
mul.f64 fd503, fd455, 0dBFE746A51650EADE;
mul.f64 fd1801, fd449, 0dBFE5F5B105F99707;
sub.f64 fd504, fd1801, fd503;
mul.f64 fd505, fd455, 0dBFE5F5B105F99707;
fma.rn.f64 fd506, fd449, 0dBFE746A51650EADE, fd505;
mul.f64 fd508, fd308, 0dBFEF838B8C811C17;
mul.f64 fd1800, fd302, 0d3FC63A1A7E0B738A;
sub.f64 fd509, fd1800, fd508;
mul.f64 fd510, fd308, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd511, fd302, 0dBFEF838B8C811C17, fd510;
mul.f64 fd1798, fd418, 0dBFEE11F642522D1C;
mul.f64 fd1799, fd424, 0dBFD5E3A8748A0BF5;
sub.f64 fd514, fd1798, fd1799;
mul.f64 fd515, fd424, 0dBFEE11F642522D1C;
fma.rn.f64 fd516, fd418, 0dBFD5E3A8748A0BF5, fd515;
mul.f64 fd1796, fd318, 0dBFADC528B5343A86;
mul.f64 fd1797, fd324, 0dBFEFF223F3635CE3;
sub.f64 fd519, fd1796, fd1797;
mul.f64 fd520, fd324, 0dBFADC528B5343A86;
fma.rn.f64 fd521, fd318, 0dBFEFF223F3635CE3, fd520;
mul.f64 fd1794, fd434, 0dBFEFC89BCEF44CF4;
mul.f64 fd1795, fd440, 0d3FBDB843E577175E;
sub.f64 fd524, fd1794, fd1795;
mul.f64 fd525, fd440, 0dBFEFC89BCEF44CF4;
fma.rn.f64 fd526, fd434, 0d3FBDB843E577175E, fd525;
mul.f64 fd528, fd340, 0dBFEEA7D99F29CADE;
mul.f64 fd1793, fd334, 0dBFD25AFBF23865BF;
sub.f64 fd529, fd1793, fd528;
mul.f64 fd530, fd340, 0dBFD25AFBF23865BF;
fma.rn.f64 fd531, fd334, 0dBFEEA7D99F29CADE, fd530;
mul.f64 fd533, fd456, 0d3FE19593DA358510;
mul.f64 fd1792, fd450, 0dBFEABC50EF4734A7;
sub.f64 fd534, fd1792, fd533;
mul.f64 fd535, fd456, 0dBFEABC50EF4734A7;
fma.rn.f64 fd536, fd450, 0d3FE19593DA358510, fd535;
add.f64 fd537, fd294, fd410;
mul.f64 fd539, fd537, 0d3FE0000000000000;
sub.f64 fd540, fd178, fd539;
add.f64 fd1791, fd1845, fd1819;
sub.f64 fd541, fd1845, fd1819;
mul.f64 fd542, fd541, 0d3FEBB67AE8584CAA;
add.f64 fd543, fd542, fd540;
sub.f64 fd544, fd540, fd542;
mul.f64 fd545, fd1791, 0d3FE0000000000000;
sub.f64 fd546, fd1872, fd545;
sub.f64 fd547, fd294, fd410;
mul.f64 fd548, fd547, 0d3FEBB67AE8584CAA;
sub.f64 fd549, fd546, fd548;
add.f64 fd550, fd548, fd546;
add.f64 fd551, fd459, fd464;
add.f64 fd552, fd194, fd551;
mul.f64 fd555, fd551, 0d3FE0000000000000;
sub.f64 fd556, fd194, fd555;
add.f64 fd1790, fd461, fd466;
sub.f64 fd557, fd461, fd466;
mul.f64 fd558, fd557, 0d3FEBB67AE8584CAA;
add.f64 fd559, fd558, fd556;
sub.f64 fd560, fd556, fd558;
add.f64 fd1789, fd1870, fd1790;
mul.f64 fd561, fd1790, 0d3FE0000000000000;
sub.f64 fd562, fd1870, fd561;
sub.f64 fd563, fd459, fd464;
mul.f64 fd564, fd563, 0d3FEBB67AE8584CAA;
sub.f64 fd565, fd562, fd564;
add.f64 fd566, fd564, fd562;
add.f64 fd567, fd469, fd474;
add.f64 fd568, fd210, fd567;
mul.f64 fd571, fd567, 0d3FE0000000000000;
sub.f64 fd572, fd210, fd571;
add.f64 fd1788, fd471, fd476;
sub.f64 fd573, fd471, fd476;
mul.f64 fd574, fd573, 0d3FEBB67AE8584CAA;
add.f64 fd575, fd574, fd572;
sub.f64 fd576, fd572, fd574;
add.f64 fd1787, fd1868, fd1788;
mul.f64 fd577, fd1788, 0d3FE0000000000000;
sub.f64 fd578, fd1868, fd577;
sub.f64 fd579, fd469, fd474;
mul.f64 fd580, fd579, 0d3FEBB67AE8584CAA;
sub.f64 fd581, fd578, fd580;
add.f64 fd582, fd580, fd578;
add.f64 fd583, fd479, fd484;
add.f64 fd584, fd185, fd583;
mul.f64 fd587, fd583, 0d3FE0000000000000;
sub.f64 fd588, fd185, fd587;
add.f64 fd1786, fd481, fd486;
sub.f64 fd589, fd481, fd486;
mul.f64 fd590, fd589, 0d3FEBB67AE8584CAA;
add.f64 fd591, fd590, fd588;
sub.f64 fd592, fd588, fd590;
add.f64 fd1785, fd191, fd1786;
mul.f64 fd593, fd1786, 0d3FE0000000000000;
sub.f64 fd594, fd191, fd593;
sub.f64 fd595, fd479, fd484;
mul.f64 fd596, fd595, 0d3FEBB67AE8584CAA;
sub.f64 fd597, fd594, fd596;
add.f64 fd598, fd596, fd594;
add.f64 fd599, fd489, fd494;
add.f64 fd600, fd201, fd599;
mul.f64 fd603, fd599, 0d3FE0000000000000;
sub.f64 fd604, fd201, fd603;
add.f64 fd1784, fd491, fd496;
sub.f64 fd605, fd491, fd496;
mul.f64 fd606, fd605, 0d3FEBB67AE8584CAA;
add.f64 fd607, fd606, fd604;
sub.f64 fd608, fd604, fd606;
add.f64 fd1783, fd207, fd1784;
mul.f64 fd609, fd1784, 0d3FE0000000000000;
sub.f64 fd610, fd207, fd609;
sub.f64 fd611, fd489, fd494;
mul.f64 fd612, fd611, 0d3FEBB67AE8584CAA;
sub.f64 fd613, fd610, fd612;
add.f64 fd614, fd612, fd610;
add.f64 fd615, fd499, fd504;
add.f64 fd616, fd217, fd615;
mul.f64 fd619, fd615, 0d3FE0000000000000;
sub.f64 fd620, fd217, fd619;
add.f64 fd1782, fd501, fd506;
sub.f64 fd621, fd501, fd506;
mul.f64 fd622, fd621, 0d3FEBB67AE8584CAA;
add.f64 fd623, fd622, fd620;
sub.f64 fd624, fd620, fd622;
add.f64 fd1781, fd223, fd1782;
mul.f64 fd625, fd1782, 0d3FE0000000000000;
sub.f64 fd626, fd223, fd625;
sub.f64 fd627, fd499, fd504;
mul.f64 fd628, fd627, 0d3FEBB67AE8584CAA;
sub.f64 fd629, fd626, fd628;
add.f64 fd630, fd628, fd626;
add.f64 fd631, fd509, fd514;
add.f64 fd632, fd186, fd631;
mul.f64 fd635, fd631, 0d3FE0000000000000;
sub.f64 fd636, fd186, fd635;
add.f64 fd1780, fd511, fd516;
sub.f64 fd637, fd511, fd516;
mul.f64 fd638, fd637, 0d3FEBB67AE8584CAA;
add.f64 fd639, fd638, fd636;
sub.f64 fd640, fd636, fd638;
add.f64 fd1779, fd192, fd1780;
mul.f64 fd641, fd1780, 0d3FE0000000000000;
sub.f64 fd642, fd192, fd641;
sub.f64 fd643, fd509, fd514;
mul.f64 fd644, fd643, 0d3FEBB67AE8584CAA;
sub.f64 fd645, fd642, fd644;
add.f64 fd646, fd644, fd642;
add.f64 fd647, fd519, fd524;
add.f64 fd648, fd202, fd647;
mul.f64 fd651, fd647, 0d3FE0000000000000;
sub.f64 fd652, fd202, fd651;
add.f64 fd1778, fd521, fd526;
sub.f64 fd653, fd521, fd526;
mul.f64 fd654, fd653, 0d3FEBB67AE8584CAA;
add.f64 fd655, fd654, fd652;
sub.f64 fd656, fd652, fd654;
add.f64 fd1777, fd208, fd1778;
mul.f64 fd657, fd1778, 0d3FE0000000000000;
sub.f64 fd658, fd208, fd657;
sub.f64 fd659, fd519, fd524;
mul.f64 fd660, fd659, 0d3FEBB67AE8584CAA;
sub.f64 fd661, fd658, fd660;
add.f64 fd662, fd660, fd658;
add.f64 fd663, fd529, fd534;
add.f64 fd664, fd218, fd663;
mul.f64 fd667, fd663, 0d3FE0000000000000;
sub.f64 fd668, fd218, fd667;
add.f64 fd1776, fd531, fd536;
sub.f64 fd669, fd531, fd536;
mul.f64 fd670, fd669, 0d3FEBB67AE8584CAA;
add.f64 fd671, fd670, fd668;
sub.f64 fd672, fd668, fd670;
add.f64 fd1775, fd224, fd1776;
mul.f64 fd673, fd1776, 0d3FE0000000000000;
sub.f64 fd674, fd224, fd673;
sub.f64 fd675, fd529, fd534;
mul.f64 fd676, fd675, 0d3FEBB67AE8584CAA;
sub.f64 fd677, fd674, fd676;
add.f64 fd678, fd676, fd674;
mov.u32 r15, %tid.x;
mul.wide.u32 rd2, r15, 795364315;
shr.u64 rd3, rd2, 32;
cvt.u32.u64 r5, rd3;
sub.s32 r6, r15, r5;
shr.u32 r7, r6, 1;
add.s32 r8, r7, r5;
shr.u32 r9, r8, 4;
mul.lo.s32 r10, r9, 27;
sub.s32 r11, r15, r10;
mad.lo.s32 r12, r9, 11664, r3;
mov.u64 rd5, %55;
mul.wide.u32 rd7, r11, 16;
add.s64 rd6, rd5, rd7;
ld.global.v2.f64 {fd679, fd680}, [rd6];
mul.f64 fd684, fd680, fd1789;
mul.f64 fd685, fd679, fd1789;
mul.f64 fd687, fd680, fd680;
mul.f64 fd1774, fd679, fd679;
sub.f64 fd688, fd1774, fd687;
mul.f64 fd689, fd680, fd679;
fma.rn.f64 fd690, fd680, fd679, fd689;
mul.f64 fd692, fd690, fd1787;
mul.f64 fd693, fd688, fd1787;
mul.f64 fd1772, fd679, fd688;
mul.f64 fd1773, fd680, fd690;
sub.f64 fd696, fd1772, fd1773;
mul.f64 fd1771, fd688, fd568;
mul.f64 fd697, fd679, fd690;
fma.rn.f64 fd698, fd680, fd688, fd697;
mul.f64 fd700, fd698, fd1785;
mul.f64 fd701, fd696, fd1785;
mul.f64 fd703, fd680, fd698;
mul.f64 fd1770, fd679, fd696;
sub.f64 fd704, fd1770, fd703;
mul.f64 fd1769, fd696, fd584;
mul.f64 fd705, fd679, fd698;
fma.rn.f64 fd706, fd680, fd696, fd705;
mul.f64 fd708, fd706, fd1783;
mul.f64 fd709, fd704, fd1783;
mul.f64 fd1767, fd679, fd704;
mul.f64 fd1768, fd680, fd706;
sub.f64 fd712, fd1767, fd1768;
mul.f64 fd1766, fd704, fd600;
mul.f64 fd713, fd679, fd706;
fma.rn.f64 fd714, fd680, fd704, fd713;
mul.f64 fd716, fd714, fd1781;
mul.f64 fd717, fd712, fd1781;
mul.f64 fd719, fd680, fd714;
mul.f64 fd1765, fd679, fd712;
sub.f64 fd720, fd1765, fd719;
mul.f64 fd1764, fd712, fd616;
mul.f64 fd721, fd679, fd714;
fma.rn.f64 fd722, fd680, fd712, fd721;
mul.f64 fd724, fd722, fd1779;
mul.f64 fd725, fd720, fd1779;
mul.f64 fd727, fd680, fd722;
mul.f64 fd1763, fd679, fd720;
sub.f64 fd728, fd1763, fd727;
mul.f64 fd1762, fd720, fd632;
mul.f64 fd729, fd679, fd722;
fma.rn.f64 fd730, fd680, fd720, fd729;
mul.f64 fd732, fd730, fd1777;
mul.f64 fd733, fd728, fd1777;
mul.f64 fd1760, fd679, fd728;
mul.f64 fd1761, fd680, fd730;
sub.f64 fd736, fd1760, fd1761;
mul.f64 fd1759, fd728, fd648;
mul.f64 fd737, fd679, fd730;
fma.rn.f64 fd738, fd680, fd728, fd737;
mul.f64 fd740, fd738, fd1775;
mul.f64 fd741, fd736, fd1775;
mul.f64 fd743, fd680, fd738;
mul.f64 fd1758, fd679, fd736;
sub.f64 fd744, fd1758, fd743;
mul.f64 fd1757, fd736, fd664;
mul.f64 fd745, fd679, fd738;
fma.rn.f64 fd746, fd680, fd736, fd745;
mul.f64 fd748, fd746, fd549;
mul.f64 fd749, fd744, fd549;
mul.f64 fd751, fd680, fd746;
mul.f64 fd1756, fd679, fd744;
sub.f64 fd752, fd1756, fd751;
mul.f64 fd1755, fd744, fd543;
mul.f64 fd753, fd679, fd746;
fma.rn.f64 fd754, fd680, fd744, fd753;
mul.f64 fd756, fd754, fd565;
mul.f64 fd757, fd752, fd565;
mul.f64 fd1753, fd679, fd752;
mul.f64 fd1754, fd680, fd754;
sub.f64 fd760, fd1753, fd1754;
mul.f64 fd1752, fd752, fd559;
mul.f64 fd761, fd679, fd754;
fma.rn.f64 fd762, fd680, fd752, fd761;
mul.f64 fd764, fd762, fd581;
mul.f64 fd765, fd760, fd581;
mul.f64 fd767, fd680, fd762;
mul.f64 fd1751, fd679, fd760;
sub.f64 fd768, fd1751, fd767;
mul.f64 fd1750, fd760, fd575;
mul.f64 fd769, fd679, fd762;
fma.rn.f64 fd770, fd680, fd760, fd769;
mul.f64 fd772, fd770, fd597;
mul.f64 fd773, fd768, fd597;
mul.f64 fd1748, fd679, fd768;
mul.f64 fd1749, fd680, fd770;
sub.f64 fd776, fd1748, fd1749;
mul.f64 fd1747, fd768, fd591;
mul.f64 fd777, fd679, fd770;
fma.rn.f64 fd778, fd680, fd768, fd777;
mul.f64 fd779, fd776, fd607;
mul.f64 fd780, fd778, fd613;
mul.f64 fd781, fd776, fd613;
ld.global.v2.f64 {fd782, fd783}, [rd6+432];
mul.f64 fd787, fd783, fd629;
mul.f64 fd788, fd782, fd629;
mul.f64 fd790, fd680, fd783;
mul.f64 fd1746, fd679, fd782;
sub.f64 fd791, fd1746, fd790;
mul.f64 fd1745, fd782, fd623;
mul.f64 fd792, fd679, fd783;
fma.rn.f64 fd793, fd680, fd782, fd792;
mul.f64 fd795, fd793, fd645;
mul.f64 fd796, fd791, fd645;
mul.f64 fd798, fd680, fd793;
mul.f64 fd1744, fd679, fd791;
sub.f64 fd799, fd1744, fd798;
mul.f64 fd1743, fd791, fd639;
mul.f64 fd800, fd679, fd793;
fma.rn.f64 fd801, fd680, fd791, fd800;
mul.f64 fd803, fd801, fd661;
mul.f64 fd804, fd799, fd661;
mul.f64 fd1741, fd679, fd799;
mul.f64 fd1742, fd680, fd801;
sub.f64 fd807, fd1741, fd1742;
mul.f64 fd1740, fd799, fd655;
mul.f64 fd808, fd679, fd801;
fma.rn.f64 fd809, fd680, fd799, fd808;
mul.f64 fd811, fd809, fd677;
mul.f64 fd812, fd807, fd677;
mul.f64 fd814, fd680, fd809;
mul.f64 fd1739, fd679, fd807;
sub.f64 fd815, fd1739, fd814;
mul.f64 fd1738, fd807, fd671;
mul.f64 fd816, fd679, fd809;
fma.rn.f64 fd817, fd680, fd807, fd816;
mul.f64 fd819, fd817, fd550;
mul.f64 fd820, fd815, fd550;
mul.f64 fd822, fd680, fd817;
mul.f64 fd1737, fd679, fd815;
sub.f64 fd823, fd1737, fd822;
mul.f64 fd1736, fd815, fd544;
mul.f64 fd824, fd679, fd817;
fma.rn.f64 fd825, fd680, fd815, fd824;
mul.f64 fd827, fd825, fd566;
mul.f64 fd828, fd823, fd566;
mul.f64 fd1734, fd679, fd823;
mul.f64 fd1735, fd680, fd825;
sub.f64 fd831, fd1734, fd1735;
mul.f64 fd1733, fd823, fd560;
mul.f64 fd832, fd679, fd825;
fma.rn.f64 fd833, fd680, fd823, fd832;
mul.f64 fd835, fd833, fd582;
mul.f64 fd836, fd831, fd582;
mul.f64 fd838, fd680, fd833;
mul.f64 fd1732, fd679, fd831;
sub.f64 fd839, fd1732, fd838;
mul.f64 fd1731, fd831, fd576;
mul.f64 fd840, fd679, fd833;
fma.rn.f64 fd841, fd680, fd831, fd840;
mul.f64 fd843, fd841, fd598;
mul.f64 fd844, fd839, fd598;
mul.f64 fd1729, fd679, fd839;
mul.f64 fd1730, fd680, fd841;
sub.f64 fd847, fd1729, fd1730;
mul.f64 fd1728, fd839, fd592;
mul.f64 fd848, fd679, fd841;
fma.rn.f64 fd849, fd680, fd839, fd848;
mul.f64 fd851, fd849, fd614;
mul.f64 fd852, fd847, fd614;
mul.f64 fd854, fd680, fd849;
mul.f64 fd1727, fd679, fd847;
sub.f64 fd855, fd1727, fd854;
mul.f64 fd1726, fd847, fd608;
mul.f64 fd856, fd679, fd849;
fma.rn.f64 fd857, fd680, fd847, fd856;
mul.f64 fd859, fd857, fd630;
mul.f64 fd860, fd855, fd630;
mul.f64 fd862, fd680, fd857;
mul.f64 fd1725, fd679, fd855;
sub.f64 fd863, fd1725, fd862;
mul.f64 fd1724, fd855, fd624;
mul.f64 fd864, fd679, fd857;
fma.rn.f64 fd865, fd680, fd855, fd864;
mul.f64 fd867, fd865, fd646;
mul.f64 fd868, fd863, fd646;
mul.f64 fd1722, fd679, fd863;
mul.f64 fd1723, fd680, fd865;
sub.f64 fd871, fd1722, fd1723;
mul.f64 fd1721, fd863, fd640;
mul.f64 fd872, fd679, fd865;
fma.rn.f64 fd873, fd680, fd863, fd872;
mul.f64 fd875, fd873, fd662;
mul.f64 fd876, fd871, fd662;
mul.f64 fd878, fd680, fd873;
mul.f64 fd1720, fd679, fd871;
sub.f64 fd879, fd1720, fd878;
mul.f64 fd1719, fd679, fd552;
mul.f64 fd880, fd679, fd873;
mul.f64 fd1718, fd871, fd656;
fma.rn.f64 fd881, fd680, fd871, fd880;
mul.f64 fd882, fd879, fd672;
mul.f64 fd883, fd881, fd678;
mul.f64 fd884, fd879, fd678;
barrier.sync 0;
mad.lo.s32 r13, r11, 432, r12;
add.f64 fd885, fd1872, fd1791;
add.f64 fd886, fd178, fd537;
st.shared.v2.f64 [r13], {fd886, fd885};
fma.rn.f64 fd887, fd680, fd552, fd685;
sub.f64 fd888, fd1719, fd684;
st.shared.v2.f64 [r13+16], {fd888, fd887};
fma.rn.f64 fd889, fd690, fd568, fd693;
sub.f64 fd890, fd1771, fd692;
st.shared.v2.f64 [r13+32], {fd890, fd889};
fma.rn.f64 fd891, fd698, fd584, fd701;
sub.f64 fd892, fd1769, fd700;
st.shared.v2.f64 [r13+48], {fd892, fd891};
fma.rn.f64 fd893, fd706, fd600, fd709;
sub.f64 fd894, fd1766, fd708;
st.shared.v2.f64 [r13+64], {fd894, fd893};
fma.rn.f64 fd895, fd714, fd616, fd717;
sub.f64 fd896, fd1764, fd716;
st.shared.v2.f64 [r13+80], {fd896, fd895};
fma.rn.f64 fd897, fd722, fd632, fd725;
sub.f64 fd898, fd1762, fd724;
st.shared.v2.f64 [r13+96], {fd898, fd897};
sub.f64 fd899, fd1759, fd732;
fma.rn.f64 fd900, fd730, fd648, fd733;
st.shared.v2.f64 [r13+112], {fd899, fd900};
fma.rn.f64 fd901, fd738, fd664, fd741;
sub.f64 fd902, fd1757, fd740;
st.shared.v2.f64 [r13+128], {fd902, fd901};
fma.rn.f64 fd903, fd746, fd543, fd749;
sub.f64 fd904, fd1755, fd748;
st.shared.v2.f64 [r13+144], {fd904, fd903};
fma.rn.f64 fd905, fd754, fd559, fd757;
sub.f64 fd906, fd1752, fd756;
st.shared.v2.f64 [r13+160], {fd906, fd905};
fma.rn.f64 fd907, fd762, fd575, fd765;
sub.f64 fd908, fd1750, fd764;
st.shared.v2.f64 [r13+176], {fd908, fd907};
fma.rn.f64 fd909, fd770, fd591, fd773;
sub.f64 fd910, fd1747, fd772;
st.shared.v2.f64 [r13+192], {fd910, fd909};
fma.rn.f64 fd911, fd778, fd607, fd781;
sub.f64 fd912, fd779, fd780;
st.shared.v2.f64 [r13+208], {fd912, fd911};
fma.rn.f64 fd913, fd783, fd623, fd788;
sub.f64 fd914, fd1745, fd787;
st.shared.v2.f64 [r13+224], {fd914, fd913};
fma.rn.f64 fd915, fd793, fd639, fd796;
sub.f64 fd916, fd1743, fd795;
st.shared.v2.f64 [r13+240], {fd916, fd915};
fma.rn.f64 fd917, fd801, fd655, fd804;
sub.f64 fd918, fd1740, fd803;
st.shared.v2.f64 [r13+256], {fd918, fd917};
fma.rn.f64 fd919, fd809, fd671, fd812;
sub.f64 fd920, fd1738, fd811;
st.shared.v2.f64 [r13+272], {fd920, fd919};
fma.rn.f64 fd921, fd817, fd544, fd820;
sub.f64 fd922, fd1736, fd819;
st.shared.v2.f64 [r13+288], {fd922, fd921};
fma.rn.f64 fd923, fd825, fd560, fd828;
sub.f64 fd924, fd1733, fd827;
st.shared.v2.f64 [r13+304], {fd924, fd923};
sub.f64 fd925, fd1731, fd835;
fma.rn.f64 fd926, fd833, fd576, fd836;
st.shared.v2.f64 [r13+320], {fd925, fd926};
fma.rn.f64 fd927, fd841, fd592, fd844;
sub.f64 fd928, fd1728, fd843;
st.shared.v2.f64 [r13+336], {fd928, fd927};
fma.rn.f64 fd929, fd849, fd608, fd852;
sub.f64 fd930, fd1726, fd851;
st.shared.v2.f64 [r13+352], {fd930, fd929};
fma.rn.f64 fd931, fd857, fd624, fd860;
sub.f64 fd932, fd1724, fd859;
st.shared.v2.f64 [r13+368], {fd932, fd931};
fma.rn.f64 fd933, fd865, fd640, fd868;
sub.f64 fd934, fd1721, fd867;
st.shared.v2.f64 [r13+384], {fd934, fd933};
fma.rn.f64 fd935, fd873, fd656, fd876;
sub.f64 fd936, fd1718, fd875;
st.shared.v2.f64 [r13+400], {fd936, fd935};
fma.rn.f64 fd937, fd881, fd672, fd884;
sub.f64 fd938, fd882, fd883;
st.shared.v2.f64 [r13+416], {fd938, fd937};
barrier.sync 0;
mad.lo.s32 r14, r11, -416, r13;
ld.shared.v2.f64 {fd939, fd940}, [r14];
ld.shared.v2.f64 {fd943, fd944}, [r14+432];
ld.shared.v2.f64 {fd947, fd948}, [r14+864];
ld.shared.v2.f64 {fd951, fd952}, [r14+1296];
ld.shared.v2.f64 {fd955, fd956}, [r14+1728];
ld.shared.v2.f64 {fd959, fd960}, [r14+2160];
ld.shared.v2.f64 {fd963, fd964}, [r14+2592];
ld.shared.v2.f64 {fd967, fd968}, [r14+3024];
ld.shared.v2.f64 {fd971, fd972}, [r14+3456];
ld.shared.v2.f64 {fd975, fd976}, [r14+3888];
ld.shared.v2.f64 {fd979, fd980}, [r14+4320];
ld.shared.v2.f64 {fd983, fd984}, [r14+4752];
ld.shared.v2.f64 {fd987, fd988}, [r14+5184];
ld.shared.v2.f64 {fd991, fd992}, [r14+5616];
ld.shared.v2.f64 {fd995, fd996}, [r14+6048];
ld.shared.v2.f64 {fd999, fd1000}, [r14+6480];
ld.shared.v2.f64 {fd1003, fd1004}, [r14+6912];
ld.shared.v2.f64 {fd1007, fd1008}, [r14+7344];
ld.shared.v2.f64 {fd1011, fd1012}, [r14+7776];
ld.shared.v2.f64 {fd1015, fd1016}, [r14+8208];
ld.shared.v2.f64 {fd1019, fd1020}, [r14+8640];
ld.shared.v2.f64 {fd1023, fd1024}, [r14+9072];
ld.shared.v2.f64 {fd1027, fd1028}, [r14+9504];
ld.shared.v2.f64 {fd1031, fd1032}, [r14+9936];
ld.shared.v2.f64 {fd1035, fd1036}, [r14+10368];
ld.shared.v2.f64 {fd1039, fd1040}, [r14+10800];
ld.shared.v2.f64 {fd1043, fd1044}, [r14+11232];
add.f64 fd1047, fd975, fd1011;
add.f64 fd1048, fd939, fd1047;
mul.f64 fd1051, fd1047, 0d3FE0000000000000;
sub.f64 fd1052, fd939, fd1051;
add.f64 fd1717, fd976, fd1012;
sub.f64 fd1053, fd976, fd1012;
mul.f64 fd1054, fd1053, 0d3FEBB67AE8584CAA;
add.f64 fd1055, fd1054, fd1052;
sub.f64 fd1056, fd1052, fd1054;
add.f64 fd1716, fd940, fd1717;
mul.f64 fd1057, fd1717, 0d3FE0000000000000;
sub.f64 fd1058, fd940, fd1057;
sub.f64 fd1059, fd975, fd1011;
mul.f64 fd1060, fd1059, 0d3FEBB67AE8584CAA;
sub.f64 fd1061, fd1058, fd1060;
add.f64 fd1062, fd1060, fd1058;
add.f64 fd1063, fd987, fd1023;
add.f64 fd1064, fd951, fd1063;
mul.f64 fd1067, fd1063, 0d3FE0000000000000;
sub.f64 fd1068, fd951, fd1067;
add.f64 fd1715, fd988, fd1024;
sub.f64 fd1069, fd988, fd1024;
mul.f64 fd1070, fd1069, 0d3FEBB67AE8584CAA;
add.f64 fd1071, fd1070, fd1068;
sub.f64 fd1072, fd1068, fd1070;
add.f64 fd1714, fd952, fd1715;
mul.f64 fd1073, fd1715, 0d3FE0000000000000;
sub.f64 fd1074, fd952, fd1073;
sub.f64 fd1075, fd987, fd1023;
mul.f64 fd1076, fd1075, 0d3FEBB67AE8584CAA;
sub.f64 fd1077, fd1074, fd1076;
add.f64 fd1078, fd1076, fd1074;
add.f64 fd1079, fd999, fd1035;
add.f64 fd1080, fd963, fd1079;
mul.f64 fd1083, fd1079, 0d3FE0000000000000;
sub.f64 fd1084, fd963, fd1083;
add.f64 fd1713, fd1000, fd1036;
sub.f64 fd1085, fd1000, fd1036;
mul.f64 fd1086, fd1085, 0d3FEBB67AE8584CAA;
add.f64 fd1087, fd1086, fd1084;
sub.f64 fd1088, fd1084, fd1086;
add.f64 fd1712, fd964, fd1713;
mul.f64 fd1089, fd1713, 0d3FE0000000000000;
sub.f64 fd1090, fd964, fd1089;
sub.f64 fd1091, fd999, fd1035;
mul.f64 fd1092, fd1091, 0d3FEBB67AE8584CAA;
sub.f64 fd1093, fd1090, fd1092;
add.f64 fd1094, fd1092, fd1090;
mul.f64 fd1710, fd1071, 0d3FE8836FA2CF5039;
mul.f64 fd1711, fd1077, 0dBFE491B7523C161D;
sub.f64 fd1097, fd1710, fd1711;
mul.f64 fd1098, fd1077, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1099, fd1071, 0dBFE491B7523C161D, fd1098;
mul.f64 fd1101, fd1093, 0dBFEF838B8C811C17;
mul.f64 fd1709, fd1087, 0d3FC63A1A7E0B738A;
sub.f64 fd1102, fd1709, fd1101;
mul.f64 fd1103, fd1093, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1104, fd1087, 0dBFEF838B8C811C17, fd1103;
mul.f64 fd1106, fd1078, 0dBFEF838B8C811C17;
mul.f64 fd1708, fd1072, 0d3FC63A1A7E0B738A;
sub.f64 fd1107, fd1708, fd1106;
mul.f64 fd1108, fd1078, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1109, fd1072, 0dBFEF838B8C811C17, fd1108;
mul.f64 fd1111, fd1094, 0dBFD5E3A8748A0BF5;
mul.f64 fd1707, fd1088, 0dBFEE11F642522D1C;
sub.f64 fd1112, fd1707, fd1111;
mul.f64 fd1113, fd1094, 0dBFEE11F642522D1C;
fma.rn.f64 fd1114, fd1088, 0dBFD5E3A8748A0BF5, fd1113;
add.f64 fd1115, fd1064, fd1080;
add.f64 fd1116, fd1048, fd1115;
mul.f64 fd1119, fd1115, 0d3FE0000000000000;
sub.f64 fd1120, fd1048, fd1119;
add.f64 fd1706, fd1714, fd1712;
sub.f64 fd1121, fd1714, fd1712;
mul.f64 fd1122, fd1121, 0d3FEBB67AE8584CAA;
add.f64 fd1123, fd1122, fd1120;
sub.f64 fd1124, fd1120, fd1122;
add.f64 fd1705, fd1716, fd1706;
mul.f64 fd1125, fd1706, 0d3FE0000000000000;
sub.f64 fd1126, fd1716, fd1125;
sub.f64 fd1127, fd1064, fd1080;
mul.f64 fd1128, fd1127, 0d3FEBB67AE8584CAA;
sub.f64 fd1129, fd1126, fd1128;
add.f64 fd1130, fd1128, fd1126;
add.f64 fd1131, fd1097, fd1102;
add.f64 fd1132, fd1055, fd1131;
mul.f64 fd1135, fd1131, 0d3FE0000000000000;
sub.f64 fd1136, fd1055, fd1135;
add.f64 fd1704, fd1099, fd1104;
sub.f64 fd1137, fd1099, fd1104;
mul.f64 fd1138, fd1137, 0d3FEBB67AE8584CAA;
add.f64 fd1139, fd1138, fd1136;
sub.f64 fd1140, fd1136, fd1138;
add.f64 fd1703, fd1061, fd1704;
mul.f64 fd1141, fd1704, 0d3FE0000000000000;
sub.f64 fd1142, fd1061, fd1141;
sub.f64 fd1143, fd1097, fd1102;
mul.f64 fd1144, fd1143, 0d3FEBB67AE8584CAA;
sub.f64 fd1145, fd1142, fd1144;
add.f64 fd1146, fd1144, fd1142;
add.f64 fd1147, fd1107, fd1112;
add.f64 fd1148, fd1056, fd1147;
mul.f64 fd1151, fd1147, 0d3FE0000000000000;
sub.f64 fd1152, fd1056, fd1151;
add.f64 fd1702, fd1109, fd1114;
sub.f64 fd1153, fd1109, fd1114;
mul.f64 fd1154, fd1153, 0d3FEBB67AE8584CAA;
add.f64 fd1155, fd1154, fd1152;
sub.f64 fd1156, fd1152, fd1154;
add.f64 fd1701, fd1062, fd1702;
mul.f64 fd1157, fd1702, 0d3FE0000000000000;
sub.f64 fd1158, fd1062, fd1157;
sub.f64 fd1159, fd1107, fd1112;
mul.f64 fd1160, fd1159, 0d3FEBB67AE8584CAA;
sub.f64 fd1161, fd1158, fd1160;
add.f64 fd1162, fd1160, fd1158;
add.f64 fd1163, fd979, fd1015;
add.f64 fd1164, fd943, fd1163;
mul.f64 fd1167, fd1163, 0d3FE0000000000000;
sub.f64 fd1168, fd943, fd1167;
add.f64 fd1700, fd980, fd1016;
sub.f64 fd1169, fd980, fd1016;
mul.f64 fd1170, fd1169, 0d3FEBB67AE8584CAA;
add.f64 fd1171, fd1170, fd1168;
sub.f64 fd1172, fd1168, fd1170;
add.f64 fd1699, fd944, fd1700;
mul.f64 fd1173, fd1700, 0d3FE0000000000000;
sub.f64 fd1174, fd944, fd1173;
sub.f64 fd1175, fd979, fd1015;
mul.f64 fd1176, fd1175, 0d3FEBB67AE8584CAA;
sub.f64 fd1177, fd1174, fd1176;
add.f64 fd1178, fd1176, fd1174;
add.f64 fd1179, fd991, fd1027;
add.f64 fd1180, fd955, fd1179;
mul.f64 fd1183, fd1179, 0d3FE0000000000000;
sub.f64 fd1184, fd955, fd1183;
add.f64 fd1698, fd992, fd1028;
sub.f64 fd1185, fd992, fd1028;
mul.f64 fd1186, fd1185, 0d3FEBB67AE8584CAA;
add.f64 fd1187, fd1186, fd1184;
sub.f64 fd1188, fd1184, fd1186;
add.f64 fd1697, fd956, fd1698;
mul.f64 fd1189, fd1698, 0d3FE0000000000000;
sub.f64 fd1190, fd956, fd1189;
sub.f64 fd1191, fd991, fd1027;
mul.f64 fd1192, fd1191, 0d3FEBB67AE8584CAA;
sub.f64 fd1193, fd1190, fd1192;
add.f64 fd1194, fd1192, fd1190;
add.f64 fd1195, fd1003, fd1039;
add.f64 fd1196, fd967, fd1195;
mul.f64 fd1199, fd1195, 0d3FE0000000000000;
sub.f64 fd1200, fd967, fd1199;
add.f64 fd1696, fd1004, fd1040;
sub.f64 fd1201, fd1004, fd1040;
mul.f64 fd1202, fd1201, 0d3FEBB67AE8584CAA;
add.f64 fd1203, fd1202, fd1200;
sub.f64 fd1204, fd1200, fd1202;
add.f64 fd1695, fd968, fd1696;
mul.f64 fd1205, fd1696, 0d3FE0000000000000;
sub.f64 fd1206, fd968, fd1205;
sub.f64 fd1207, fd1003, fd1039;
mul.f64 fd1208, fd1207, 0d3FEBB67AE8584CAA;
sub.f64 fd1209, fd1206, fd1208;
add.f64 fd1210, fd1208, fd1206;
mul.f64 fd1693, fd1187, 0d3FE8836FA2CF5039;
mul.f64 fd1694, fd1193, 0dBFE491B7523C161D;
sub.f64 fd1213, fd1693, fd1694;
mul.f64 fd1214, fd1193, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1215, fd1187, 0dBFE491B7523C161D, fd1214;
mul.f64 fd1217, fd1209, 0dBFEF838B8C811C17;
mul.f64 fd1692, fd1203, 0d3FC63A1A7E0B738A;
sub.f64 fd1218, fd1692, fd1217;
mul.f64 fd1219, fd1209, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1220, fd1203, 0dBFEF838B8C811C17, fd1219;
mul.f64 fd1222, fd1194, 0dBFEF838B8C811C17;
mul.f64 fd1691, fd1188, 0d3FC63A1A7E0B738A;
sub.f64 fd1223, fd1691, fd1222;
mul.f64 fd1224, fd1194, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1225, fd1188, 0dBFEF838B8C811C17, fd1224;
mul.f64 fd1227, fd1210, 0dBFD5E3A8748A0BF5;
mul.f64 fd1690, fd1204, 0dBFEE11F642522D1C;
sub.f64 fd1228, fd1690, fd1227;
mul.f64 fd1229, fd1210, 0dBFEE11F642522D1C;
fma.rn.f64 fd1230, fd1204, 0dBFD5E3A8748A0BF5, fd1229;
add.f64 fd1231, fd1180, fd1196;
add.f64 fd1232, fd1164, fd1231;
mul.f64 fd1235, fd1231, 0d3FE0000000000000;
sub.f64 fd1236, fd1164, fd1235;
add.f64 fd1689, fd1697, fd1695;
sub.f64 fd1237, fd1697, fd1695;
mul.f64 fd1238, fd1237, 0d3FEBB67AE8584CAA;
add.f64 fd1239, fd1238, fd1236;
sub.f64 fd1240, fd1236, fd1238;
add.f64 fd1688, fd1699, fd1689;
mul.f64 fd1241, fd1689, 0d3FE0000000000000;
sub.f64 fd1242, fd1699, fd1241;
sub.f64 fd1243, fd1180, fd1196;
mul.f64 fd1244, fd1243, 0d3FEBB67AE8584CAA;
sub.f64 fd1245, fd1242, fd1244;
add.f64 fd1246, fd1244, fd1242;
add.f64 fd1247, fd1213, fd1218;
add.f64 fd1248, fd1171, fd1247;
mul.f64 fd1251, fd1247, 0d3FE0000000000000;
sub.f64 fd1252, fd1171, fd1251;
add.f64 fd1687, fd1215, fd1220;
sub.f64 fd1253, fd1215, fd1220;
mul.f64 fd1254, fd1253, 0d3FEBB67AE8584CAA;
add.f64 fd1255, fd1254, fd1252;
sub.f64 fd1256, fd1252, fd1254;
add.f64 fd1686, fd1177, fd1687;
mul.f64 fd1257, fd1687, 0d3FE0000000000000;
sub.f64 fd1258, fd1177, fd1257;
sub.f64 fd1259, fd1213, fd1218;
mul.f64 fd1260, fd1259, 0d3FEBB67AE8584CAA;
sub.f64 fd1261, fd1258, fd1260;
add.f64 fd1262, fd1260, fd1258;
add.f64 fd1263, fd1223, fd1228;
add.f64 fd1264, fd1172, fd1263;
mul.f64 fd1267, fd1263, 0d3FE0000000000000;
sub.f64 fd1268, fd1172, fd1267;
add.f64 fd1685, fd1225, fd1230;
sub.f64 fd1269, fd1225, fd1230;
mul.f64 fd1270, fd1269, 0d3FEBB67AE8584CAA;
add.f64 fd1271, fd1270, fd1268;
sub.f64 fd1272, fd1268, fd1270;
add.f64 fd1684, fd1178, fd1685;
mul.f64 fd1273, fd1685, 0d3FE0000000000000;
sub.f64 fd1274, fd1178, fd1273;
sub.f64 fd1275, fd1223, fd1228;
mul.f64 fd1276, fd1275, 0d3FEBB67AE8584CAA;
sub.f64 fd1277, fd1274, fd1276;
add.f64 fd1278, fd1276, fd1274;
add.f64 fd1279, fd983, fd1019;
add.f64 fd1280, fd947, fd1279;
mul.f64 fd1283, fd1279, 0d3FE0000000000000;
sub.f64 fd1284, fd947, fd1283;
add.f64 fd1683, fd984, fd1020;
sub.f64 fd1285, fd984, fd1020;
mul.f64 fd1286, fd1285, 0d3FEBB67AE8584CAA;
add.f64 fd1287, fd1286, fd1284;
sub.f64 fd1288, fd1284, fd1286;
add.f64 fd1682, fd948, fd1683;
mul.f64 fd1289, fd1683, 0d3FE0000000000000;
sub.f64 fd1290, fd948, fd1289;
sub.f64 fd1291, fd983, fd1019;
mul.f64 fd1292, fd1291, 0d3FEBB67AE8584CAA;
sub.f64 fd1293, fd1290, fd1292;
add.f64 fd1294, fd1292, fd1290;
add.f64 fd1295, fd995, fd1031;
add.f64 fd1296, fd959, fd1295;
mul.f64 fd1299, fd1295, 0d3FE0000000000000;
sub.f64 fd1300, fd959, fd1299;
add.f64 fd1681, fd996, fd1032;
sub.f64 fd1301, fd996, fd1032;
mul.f64 fd1302, fd1301, 0d3FEBB67AE8584CAA;
add.f64 fd1303, fd1302, fd1300;
sub.f64 fd1304, fd1300, fd1302;
add.f64 fd1680, fd960, fd1681;
mul.f64 fd1305, fd1681, 0d3FE0000000000000;
sub.f64 fd1306, fd960, fd1305;
sub.f64 fd1307, fd995, fd1031;
mul.f64 fd1308, fd1307, 0d3FEBB67AE8584CAA;
sub.f64 fd1309, fd1306, fd1308;
add.f64 fd1310, fd1308, fd1306;
add.f64 fd1311, fd1007, fd1043;
add.f64 fd1312, fd971, fd1311;
mul.f64 fd1315, fd1311, 0d3FE0000000000000;
sub.f64 fd1316, fd971, fd1315;
add.f64 fd1679, fd1008, fd1044;
sub.f64 fd1317, fd1008, fd1044;
mul.f64 fd1318, fd1317, 0d3FEBB67AE8584CAA;
add.f64 fd1319, fd1318, fd1316;
sub.f64 fd1320, fd1316, fd1318;
add.f64 fd1678, fd972, fd1679;
mul.f64 fd1321, fd1679, 0d3FE0000000000000;
sub.f64 fd1322, fd972, fd1321;
sub.f64 fd1323, fd1007, fd1043;
mul.f64 fd1324, fd1323, 0d3FEBB67AE8584CAA;
sub.f64 fd1325, fd1322, fd1324;
add.f64 fd1326, fd1324, fd1322;
mul.f64 fd1676, fd1303, 0d3FE8836FA2CF5039;
mul.f64 fd1677, fd1309, 0dBFE491B7523C161D;
sub.f64 fd1329, fd1676, fd1677;
mul.f64 fd1330, fd1309, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1331, fd1303, 0dBFE491B7523C161D, fd1330;
mul.f64 fd1674, fd1319, 0d3FC63A1A7E0B738A;
mul.f64 fd1675, fd1325, 0dBFEF838B8C811C17;
sub.f64 fd1334, fd1674, fd1675;
mul.f64 fd1335, fd1325, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1336, fd1319, 0dBFEF838B8C811C17, fd1335;
mul.f64 fd1338, fd1310, 0dBFEF838B8C811C17;
mul.f64 fd1673, fd1304, 0d3FC63A1A7E0B738A;
sub.f64 fd1339, fd1673, fd1338;
mul.f64 fd1340, fd1310, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1341, fd1304, 0dBFEF838B8C811C17, fd1340;
mul.f64 fd1343, fd1326, 0dBFD5E3A8748A0BF5;
mul.f64 fd1672, fd1320, 0dBFEE11F642522D1C;
sub.f64 fd1344, fd1672, fd1343;
mul.f64 fd1345, fd1326, 0dBFEE11F642522D1C;
fma.rn.f64 fd1346, fd1320, 0dBFD5E3A8748A0BF5, fd1345;
add.f64 fd1347, fd1296, fd1312;
add.f64 fd1348, fd1280, fd1347;
mul.f64 fd1351, fd1347, 0d3FE0000000000000;
sub.f64 fd1352, fd1280, fd1351;
add.f64 fd1671, fd1680, fd1678;
sub.f64 fd1353, fd1680, fd1678;
mul.f64 fd1354, fd1353, 0d3FEBB67AE8584CAA;
add.f64 fd1355, fd1354, fd1352;
sub.f64 fd1356, fd1352, fd1354;
add.f64 fd1670, fd1682, fd1671;
mul.f64 fd1357, fd1671, 0d3FE0000000000000;
sub.f64 fd1358, fd1682, fd1357;
sub.f64 fd1359, fd1296, fd1312;
mul.f64 fd1360, fd1359, 0d3FEBB67AE8584CAA;
sub.f64 fd1361, fd1358, fd1360;
add.f64 fd1362, fd1360, fd1358;
add.f64 fd1363, fd1329, fd1334;
add.f64 fd1364, fd1287, fd1363;
mul.f64 fd1367, fd1363, 0d3FE0000000000000;
sub.f64 fd1368, fd1287, fd1367;
add.f64 fd1669, fd1331, fd1336;
sub.f64 fd1369, fd1331, fd1336;
mul.f64 fd1370, fd1369, 0d3FEBB67AE8584CAA;
add.f64 fd1371, fd1370, fd1368;
sub.f64 fd1372, fd1368, fd1370;
add.f64 fd1668, fd1293, fd1669;
mul.f64 fd1373, fd1669, 0d3FE0000000000000;
sub.f64 fd1374, fd1293, fd1373;
sub.f64 fd1375, fd1329, fd1334;
mul.f64 fd1376, fd1375, 0d3FEBB67AE8584CAA;
sub.f64 fd1377, fd1374, fd1376;
add.f64 fd1378, fd1376, fd1374;
add.f64 fd1379, fd1339, fd1344;
add.f64 fd1380, fd1288, fd1379;
mul.f64 fd1383, fd1379, 0d3FE0000000000000;
sub.f64 fd1384, fd1288, fd1383;
add.f64 fd1667, fd1341, fd1346;
sub.f64 fd1385, fd1341, fd1346;
mul.f64 fd1386, fd1385, 0d3FEBB67AE8584CAA;
add.f64 fd1387, fd1386, fd1384;
sub.f64 fd1388, fd1384, fd1386;
add.f64 fd1666, fd1294, fd1667;
mul.f64 fd1389, fd1667, 0d3FE0000000000000;
sub.f64 fd1390, fd1294, fd1389;
sub.f64 fd1391, fd1339, fd1344;
mul.f64 fd1392, fd1391, 0d3FEBB67AE8584CAA;
sub.f64 fd1393, fd1390, fd1392;
add.f64 fd1394, fd1392, fd1390;
mul.f64 fd1396, fd1686, 0dBFCD84D223638000;
mul.f64 fd1665, fd1248, 0d3FEF232EFF15C9E6;
sub.f64 fd1397, fd1665, fd1396;
mul.f64 fd1398, fd1686, 0d3FEF232EFF15C9E6;
fma.rn.f64 fd1399, fd1248, 0dBFCD84D223638000, fd1398;
mul.f64 fd1663, fd1364, 0d3FEC98A37A9A7850;
mul.f64 fd1664, fd1668, 0dBFDCB920325BAFA6;
sub.f64 fd1402, fd1663, fd1664;
mul.f64 fd1403, fd1668, 0d3FEC98A37A9A7850;
fma.rn.f64 fd1404, fd1364, 0dBFDCB920325BAFA6, fd1403;
mul.f64 fd1661, fd1264, 0d3FEC98A37A9A7850;
mul.f64 fd1662, fd1684, 0dBFDCB920325BAFA6;
sub.f64 fd1407, fd1661, fd1662;
mul.f64 fd1408, fd1684, 0d3FEC98A37A9A7850;
fma.rn.f64 fd1409, fd1264, 0dBFDCB920325BAFA6, fd1408;
mul.f64 fd1659, fd1380, 0d3FE31BEC55BC71BC;
mul.f64 fd1660, fd1666, 0dBFE9AAFE4207DF5F;
sub.f64 fd1412, fd1659, fd1660;
mul.f64 fd1413, fd1666, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd1414, fd1380, 0dBFE9AAFE4207DF5F, fd1413;
mul.f64 fd1657, fd1239, 0d3FE8836FA2CF5039;
mul.f64 fd1658, fd1245, 0dBFE491B7523C161D;
sub.f64 fd1417, fd1657, fd1658;
mul.f64 fd1418, fd1245, 0d3FE8836FA2CF5039;
fma.rn.f64 fd1419, fd1239, 0dBFE491B7523C161D, fd1418;
mul.f64 fd1421, fd1361, 0dBFEF838B8C811C17;
mul.f64 fd1656, fd1355, 0d3FC63A1A7E0B738A;
sub.f64 fd1422, fd1656, fd1421;
mul.f64 fd1423, fd1361, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1424, fd1355, 0dBFEF838B8C811C17, fd1423;
mul.f64 fd1426, fd1261, 0dBFE9AAFE4207DF5F;
mul.f64 fd1655, fd1255, 0d3FE31BEC55BC71BC;
sub.f64 fd1427, fd1655, fd1426;
mul.f64 fd1428, fd1261, 0d3FE31BEC55BC71BC;
fma.rn.f64 fd1429, fd1255, 0dBFE9AAFE4207DF5F, fd1428;
mul.f64 fd1431, fd1377, 0dBFEEA7D99F29CADE;
mul.f64 fd1654, fd1371, 0dBFD25AFBF23865BF;
sub.f64 fd1432, fd1654, fd1431;
mul.f64 fd1433, fd1377, 0dBFD25AFBF23865BF;
fma.rn.f64 fd1434, fd1371, 0dBFEEA7D99F29CADE, fd1433;
mul.f64 fd1436, fd1277, 0dBFED6206BEB6C24B;
mul.f64 fd1653, fd1271, 0d3FD9595EF26FB670;
sub.f64 fd1437, fd1653, fd1436;
mul.f64 fd1438, fd1277, 0d3FD9595EF26FB670;
fma.rn.f64 fd1439, fd1271, 0dBFED6206BEB6C24B, fd1438;
mul.f64 fd1441, fd1393, 0dBFE746A51650EADE;
mul.f64 fd1652, fd1387, 0dBFE5F5B105F99707;
sub.f64 fd1442, fd1652, fd1441;
mul.f64 fd1443, fd1393, 0dBFE5F5B105F99707;
fma.rn.f64 fd1444, fd1387, 0dBFE746A51650EADE, fd1443;
mul.f64 fd1650, fd1240, 0d3FC63A1A7E0B738A;
mul.f64 fd1651, fd1246, 0dBFEF838B8C811C17;
sub.f64 fd1447, fd1650, fd1651;
mul.f64 fd1448, fd1246, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd1449, fd1240, 0dBFEF838B8C811C17, fd1448;
mul.f64 fd1648, fd1356, 0dBFEE11F642522D1C;
mul.f64 fd1649, fd1362, 0dBFD5E3A8748A0BF5;
sub.f64 fd1452, fd1648, fd1649;
mul.f64 fd1453, fd1362, 0dBFEE11F642522D1C;
fma.rn.f64 fd1454, fd1356, 0dBFD5E3A8748A0BF5, fd1453;
mul.f64 fd1646, fd1256, 0dBFADC528B5343A86;
mul.f64 fd1647, fd1262, 0dBFEFF223F3635CE3;
sub.f64 fd1457, fd1646, fd1647;
mul.f64 fd1458, fd1262, 0dBFADC528B5343A86;
fma.rn.f64 fd1459, fd1256, 0dBFEFF223F3635CE3, fd1458;
mul.f64 fd1644, fd1372, 0dBFEFC89BCEF44CF4;
mul.f64 fd1645, fd1378, 0d3FBDB843E577175E;
sub.f64 fd1462, fd1644, fd1645;
mul.f64 fd1463, fd1378, 0dBFEFC89BCEF44CF4;
fma.rn.f64 fd1464, fd1372, 0d3FBDB843E577175E, fd1463;
mul.f64 fd1466, fd1278, 0dBFEEA7D99F29CADE;
mul.f64 fd1643, fd1272, 0dBFD25AFBF23865BF;
sub.f64 fd1467, fd1643, fd1466;
mul.f64 fd1468, fd1278, 0dBFD25AFBF23865BF;
fma.rn.f64 fd1469, fd1272, 0dBFEEA7D99F29CADE, fd1468;
mul.f64 fd1471, fd1394, 0d3FE19593DA358510;
mul.f64 fd1642, fd1388, 0dBFEABC50EF4734A7;
sub.f64 fd1472, fd1642, fd1471;
mul.f64 fd1473, fd1394, 0dBFEABC50EF4734A7;
fma.rn.f64 fd1474, fd1388, 0d3FE19593DA358510, fd1473;
add.f64 fd1475, fd1232, fd1348;
mul.f64 fd1477, fd1475, 0d3FE0000000000000;
sub.f64 fd1478, fd1116, fd1477;
add.f64 fd1641, fd1688, fd1670;
sub.f64 fd1479, fd1688, fd1670;
mul.f64 fd1480, fd1479, 0d3FEBB67AE8584CAA;
mul.f64 fd1481, fd1641, 0d3FE0000000000000;
sub.f64 fd1482, fd1705, fd1481;
sub.f64 fd1483, fd1232, fd1348;
mul.f64 fd1484, fd1483, 0d3FEBB67AE8584CAA;
add.f64 fd1485, fd1397, fd1402;
mul.f64 fd1487, fd1485, 0d3FE0000000000000;
sub.f64 fd1488, fd1132, fd1487;
add.f64 fd1640, fd1399, fd1404;
sub.f64 fd1489, fd1399, fd1404;
mul.f64 fd1490, fd1489, 0d3FEBB67AE8584CAA;
mul.f64 fd1491, fd1640, 0d3FE0000000000000;
sub.f64 fd1492, fd1703, fd1491;
sub.f64 fd1493, fd1397, fd1402;
mul.f64 fd1494, fd1493, 0d3FEBB67AE8584CAA;
add.f64 fd1495, fd1407, fd1412;
mul.f64 fd1497, fd1495, 0d3FE0000000000000;
sub.f64 fd1498, fd1148, fd1497;
add.f64 fd1639, fd1409, fd1414;
sub.f64 fd1499, fd1409, fd1414;
mul.f64 fd1500, fd1499, 0d3FEBB67AE8584CAA;
mul.f64 fd1501, fd1639, 0d3FE0000000000000;
sub.f64 fd1502, fd1701, fd1501;
sub.f64 fd1503, fd1407, fd1412;
mul.f64 fd1504, fd1503, 0d3FEBB67AE8584CAA;
add.f64 fd1505, fd1417, fd1422;
mul.f64 fd1507, fd1505, 0d3FE0000000000000;
sub.f64 fd1508, fd1123, fd1507;
add.f64 fd1638, fd1419, fd1424;
sub.f64 fd1509, fd1419, fd1424;
mul.f64 fd1510, fd1509, 0d3FEBB67AE8584CAA;
mul.f64 fd1511, fd1638, 0d3FE0000000000000;
sub.f64 fd1512, fd1129, fd1511;
sub.f64 fd1513, fd1417, fd1422;
mul.f64 fd1514, fd1513, 0d3FEBB67AE8584CAA;
add.f64 fd1515, fd1427, fd1432;
mul.f64 fd1517, fd1515, 0d3FE0000000000000;
sub.f64 fd1518, fd1139, fd1517;
add.f64 fd1637, fd1429, fd1434;
sub.f64 fd1519, fd1429, fd1434;
mul.f64 fd1520, fd1519, 0d3FEBB67AE8584CAA;
mul.f64 fd1521, fd1637, 0d3FE0000000000000;
sub.f64 fd1522, fd1145, fd1521;
sub.f64 fd1523, fd1427, fd1432;
mul.f64 fd1524, fd1523, 0d3FEBB67AE8584CAA;
add.f64 fd1525, fd1437, fd1442;
mul.f64 fd1527, fd1525, 0d3FE0000000000000;
sub.f64 fd1528, fd1155, fd1527;
add.f64 fd1636, fd1439, fd1444;
sub.f64 fd1529, fd1439, fd1444;
mul.f64 fd1530, fd1529, 0d3FEBB67AE8584CAA;
mul.f64 fd1531, fd1636, 0d3FE0000000000000;
sub.f64 fd1532, fd1161, fd1531;
sub.f64 fd1533, fd1437, fd1442;
mul.f64 fd1534, fd1533, 0d3FEBB67AE8584CAA;
add.f64 fd1535, fd1447, fd1452;
mul.f64 fd1537, fd1535, 0d3FE0000000000000;
sub.f64 fd1538, fd1124, fd1537;
add.f64 fd1635, fd1449, fd1454;
sub.f64 fd1539, fd1449, fd1454;
mul.f64 fd1540, fd1539, 0d3FEBB67AE8584CAA;
mul.f64 fd1541, fd1635, 0d3FE0000000000000;
sub.f64 fd1542, fd1130, fd1541;
sub.f64 fd1543, fd1447, fd1452;
mul.f64 fd1544, fd1543, 0d3FEBB67AE8584CAA;
add.f64 fd1545, fd1457, fd1462;
mul.f64 fd1547, fd1545, 0d3FE0000000000000;
sub.f64 fd1548, fd1140, fd1547;
add.f64 fd1634, fd1459, fd1464;
sub.f64 fd1549, fd1459, fd1464;
mul.f64 fd1550, fd1549, 0d3FEBB67AE8584CAA;
mul.f64 fd1551, fd1634, 0d3FE0000000000000;
sub.f64 fd1552, fd1146, fd1551;
sub.f64 fd1553, fd1457, fd1462;
mul.f64 fd1554, fd1553, 0d3FEBB67AE8584CAA;
add.f64 fd1555, fd1467, fd1472;
mul.f64 fd1557, fd1555, 0d3FE0000000000000;
sub.f64 fd1558, fd1156, fd1557;
add.f64 fd1633, fd1469, fd1474;
sub.f64 fd1559, fd1469, fd1474;
mul.f64 fd1560, fd1559, 0d3FEBB67AE8584CAA;
mul.f64 fd1561, fd1633, 0d3FE0000000000000;
sub.f64 fd1562, fd1162, fd1561;
sub.f64 fd1563, fd1467, fd1472;
mul.f64 fd1564, fd1563, 0d3FEBB67AE8584CAA;
add.f64 %1, fd1705, fd1641;
add.f64 %0, fd1116, fd1475;
add.f64 %3, fd1703, fd1640;
add.f64 %2, fd1132, fd1485;
add.f64 %5, fd1701, fd1639;
add.f64 %4, fd1148, fd1495;
add.f64 %7, fd1129, fd1638;
add.f64 %6, fd1123, fd1505;
add.f64 %9, fd1145, fd1637;
add.f64 %8, fd1139, fd1515;
add.f64 %11, fd1161, fd1636;
add.f64 %10, fd1155, fd1525;
add.f64 %13, fd1130, fd1635;
add.f64 %12, fd1124, fd1535;
add.f64 %15, fd1146, fd1634;
add.f64 %14, fd1140, fd1545;
add.f64 %17, fd1162, fd1633;
add.f64 %16, fd1156, fd1555;
sub.f64 %19, fd1482, fd1484;
add.f64 %18, fd1480, fd1478;
sub.f64 %21, fd1492, fd1494;
add.f64 %20, fd1490, fd1488;
add.f64 %22, fd1500, fd1498;
sub.f64 %23, fd1502, fd1504;
add.f64 %24, fd1510, fd1508;
sub.f64 %25, fd1512, fd1514;
add.f64 %26, fd1520, fd1518;
sub.f64 %27, fd1522, fd1524;
add.f64 %28, fd1530, fd1528;
sub.f64 %29, fd1532, fd1534;
sub.f64 %31, fd1542, fd1544;
add.f64 %30, fd1540, fd1538;
sub.f64 %33, fd1552, fd1554;
add.f64 %32, fd1550, fd1548;
sub.f64 %35, fd1562, fd1564;
add.f64 %34, fd1560, fd1558;
add.f64 %37, fd1484, fd1482;
sub.f64 %36, fd1478, fd1480;
add.f64 %39, fd1494, fd1492;
sub.f64 %38, fd1488, fd1490;
add.f64 %41, fd1504, fd1502;
sub.f64 %40, fd1498, fd1500;
add.f64 %43, fd1514, fd1512;
sub.f64 %42, fd1508, fd1510;
add.f64 %45, fd1524, fd1522;
sub.f64 %44, fd1518, fd1520;
add.f64 %47, fd1534, fd1532;
sub.f64 %46, fd1528, fd1530;
add.f64 %49, fd1544, fd1542;
sub.f64 %48, fd1538, fd1540;
add.f64 %51, fd1554, fd1552;
sub.f64 %50, fd1548, fd1550;
add.f64 %53, fd1564, fd1562;
sub.f64 %52, fd1558, fd1560;
})"
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y), "=d"(rmem[5].x), "=d"(rmem[5].y), "=d"(rmem[6].x), "=d"(rmem[6].y), "=d"(rmem[7].x), "=d"(rmem[7].y), "=d"(rmem[8].x), "=d"(rmem[8].y), "=d"(rmem[9].x), "=d"(rmem[9].y), "=d"(rmem[10].x), "=d"(rmem[10].y), "=d"(rmem[11].x), "=d"(rmem[11].y), "=d"(rmem[12].x), "=d"(rmem[12].y), "=d"(rmem[13].x), "=d"(rmem[13].y), "=d"(rmem[14].x), "=d"(rmem[14].y), "=d"(rmem[15].x), "=d"(rmem[15].y), "=d"(rmem[16].x), "=d"(rmem[16].y), "=d"(rmem[17].x), "=d"(rmem[17].y), "=d"(rmem[18].x), "=d"(rmem[18].y), "=d"(rmem[19].x), "=d"(rmem[19].y), "=d"(rmem[20].x), "=d"(rmem[20].y), "=d"(rmem[21].x), "=d"(rmem[21].y), "=d"(rmem[22].x), "=d"(rmem[22].y), "=d"(rmem[23].x), "=d"(rmem[23].y), "=d"(rmem[24].x), "=d"(rmem[24].y), "=d"(rmem[25].x), "=d"(rmem[25].y), "=d"(rmem[26].x), "=d"(rmem[26].y): "r"(smem), "l"(lut_dp_27_729), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y), "d"(rmem[5].x), "d"(rmem[5].y), "d"(rmem[6].x), "d"(rmem[6].y), "d"(rmem[7].x), "d"(rmem[7].y), "d"(rmem[8].x), "d"(rmem[8].y), "d"(rmem[9].x), "d"(rmem[9].y), "d"(rmem[10].x), "d"(rmem[10].y), "d"(rmem[11].x), "d"(rmem[11].y), "d"(rmem[12].x), "d"(rmem[12].y), "d"(rmem[13].x), "d"(rmem[13].y), "d"(rmem[14].x), "d"(rmem[14].y), "d"(rmem[15].x), "d"(rmem[15].y), "d"(rmem[16].x), "d"(rmem[16].y), "d"(rmem[17].x), "d"(rmem[17].y), "d"(rmem[18].x), "d"(rmem[18].y), "d"(rmem[19].x), "d"(rmem[19].y), "d"(rmem[20].x), "d"(rmem[20].y), "d"(rmem[21].x), "d"(rmem[21].y), "d"(rmem[22].x), "d"(rmem[22].y), "d"(rmem[23].x), "d"(rmem[23].y), "d"(rmem[24].x), "d"(rmem[24].y), "d"(rmem[25].x), "d"(rmem[25].y), "d"(rmem[26].x), "d"(rmem[26].y), "d"(rmem[10].y), "d"(rmem[19].y), "d"(rmem[1].y), "d"(rmem[22].y), "d"(rmem[13].y), "d"(rmem[4].y), 
"d"(rmem[16].y), "d"(rmem[25].y), "d"(rmem[7].y), "d"(rmem[11].y), "d"(rmem[20].y), "d"(rmem[2].y), "d"(rmem[23].y), "d"(rmem[14].y), "d"(rmem[5].y), "d"(rmem[17].y), "d"(rmem[8].y));
};




// Specialization <521, double, 1> of cufftdx_private_function.
//
// The whole body is one inline-PTX statement that reads the nine complex
// doubles rmem[0..8], pushes them through three 9-point butterfly passes
// separated by two shared-memory exchanges, and writes the nine results back
// to rmem[0..8].
//
// Parameters:
//   rmem - per-thread array of complex<double>; elements 0..8 (.x and .y) are
//          asm inputs, and all eighteen components are overwritten through the
//          asm outputs %0..%17.
//   smem - 32-bit shared-memory address (operand %18) used as the base for every
//          st.shared / ld.shared in the body.
//
// Names referenced but not declared in this block: lut_dp_9_729 (operand %19)
// and lut_dp_9_81 (operand %20). Both are passed as 64-bit addresses and read
// with ld.global.v2.f64; they are presumably twiddle-factor tables -- confirm
// at their definition.
//
// Outline of the PTX, in program order:
//   1. r3 = %tid.y * 11664 + smem. 11664 = 729 * 16, i.e. the size of 729
//      (double, double) pairs.
//   2. Pass 1 on the register inputs: 3-point butterflies over elements
//      (0,3,6), (1,4,7), (2,5,8), fixed rotations, then three more 3-point
//      butterflies. The f64 immediates decode to 0.5, ~0.8660254 (sqrt(3)/2)
//      and the (cos, -sin) pairs of 2*pi/9, 4*pi/9 and 8*pi/9.
//      NOTE(review): this looks like a forward 9-point DFT; inferred from the
//      constants and the header guard name only.
//   3. q = %tid.x / 81 and m = %tid.x % 81, computed by multiply-and-shift
//      (mul.wide.u32 by the 32-bit pattern of -901412889, then >> 38).
//      r8 = r3 + q * 11664.
//   4. Eight of the nine pass-1 results are complex-multiplied by factors
//      built from w = lut_dp_9_729[m] and v = the entry 1296 bytes (81 entries)
//      later: w, w^2, w^3, w^4, v, w*v, w^2*v, w^3*v.
//   5. barrier.sync 0; store nine consecutive 16-byte values at
//      r9 = r8 + m * 144; barrier.sync 0; reload nine values from
//      r11 = r8 + m * 16 at a 1296-byte stride.
//   6. Pass 2: same butterfly network. Factors come from lut_dp_9_81[m / 9] and
//      the entry 144 bytes (9 entries) later, combined as in step 4. m / 9 is
//      computed by multiply-and-shift (954437177, >> 33).
//   7. barrier.sync 0; store nine values at r17 = r8 + (m % 9) * 16 +
//      (m / 9) * 1296 with a 144-byte stride; barrier.sync 0; reload from r11
//      at a 1296-byte stride.
//   8. Pass 3: same butterfly network without a twiddle multiply; the sums and
//      differences are written straight to the outputs %0..%17.
//
// The body executes `barrier.sync 0` four times, so every thread that
// participates in barrier 0 has to execute this function.
// NOTE(review): the asm statement has no clobber list (no "memory") even though
// it reads and writes shared memory; it relies on `volatile` and the barriers.
// Confirm this is intentional in the generator.
template<> __forceinline__ __device__ void cufftdx_private_function<521, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

// PTX body: %0..%17 are outputs, %18..%43 are inputs (see the operand map
// placed just before the constraint list below).
asm volatile (R"({
.reg .b32 r<18>;
.reg .f64 fd<613>;
.reg .b64 rd<12>;
mov.u32 r1, %tid.y;
mov.u32 r2, %18;
mad.lo.s32 r3, r1, 11664, r2;
add.f64 fd37, %29, %37;
add.f64 fd38, %21, fd37;
add.f64 fd39, %30, %38;
add.f64 fd40, %22, fd39;
mul.f64 fd41, fd37, 0d3FE0000000000000;
sub.f64 fd42, %21, fd41;
sub.f64 fd43, %30, %38;
mul.f64 fd44, fd43, 0d3FEBB67AE8584CAA;
add.f64 fd45, fd44, fd42;
sub.f64 fd46, fd42, fd44;
mul.f64 fd47, fd39, 0d3FE0000000000000;
sub.f64 fd48, %22, fd47;
sub.f64 fd49, %29, %37;
mul.f64 fd50, fd49, 0d3FEBB67AE8584CAA;
sub.f64 fd51, fd48, fd50;
add.f64 fd52, fd50, fd48;
add.f64 fd53, %31, %39;
add.f64 fd54, %23, fd53;
add.f64 fd55, %33, %41;
add.f64 fd56, %25, fd55;
mul.f64 fd57, fd53, 0d3FE0000000000000;
sub.f64 fd58, %23, fd57;
sub.f64 fd59, %33, %41;
mul.f64 fd60, fd59, 0d3FEBB67AE8584CAA;
add.f64 fd61, fd60, fd58;
sub.f64 fd62, fd58, fd60;
mul.f64 fd63, fd55, 0d3FE0000000000000;
sub.f64 fd64, %25, fd63;
sub.f64 fd65, %31, %39;
mul.f64 fd66, fd65, 0d3FEBB67AE8584CAA;
sub.f64 fd67, fd64, fd66;
add.f64 fd68, fd66, fd64;
add.f64 fd69, %34, %42;
add.f64 fd70, %26, fd69;
add.f64 fd71, %36, %43;
add.f64 fd72, %28, fd71;
mul.f64 fd73, fd69, 0d3FE0000000000000;
sub.f64 fd74, %26, fd73;
sub.f64 fd75, %36, %43;
mul.f64 fd76, fd75, 0d3FEBB67AE8584CAA;
add.f64 fd77, fd76, fd74;
sub.f64 fd78, fd74, fd76;
mul.f64 fd79, fd71, 0d3FE0000000000000;
sub.f64 fd80, %28, fd79;
sub.f64 fd81, %34, %42;
mul.f64 fd82, fd81, 0d3FEBB67AE8584CAA;
sub.f64 fd83, fd80, fd82;
add.f64 fd84, fd82, fd80;
mov.u32 r4, %tid.x;
mul.f64 fd85, fd61, 0d3FE8836FA2CF5039;
mul.f64 fd86, fd67, 0dBFE491B7523C161D;
sub.f64 fd87, fd85, fd86;
mul.f64 fd88, fd67, 0d3FE8836FA2CF5039;
fma.rn.f64 fd89, fd61, 0dBFE491B7523C161D, fd88;
mul.f64 fd90, fd77, 0d3FC63A1A7E0B738A;
mul.f64 fd91, fd83, 0dBFEF838B8C811C17;
sub.f64 fd92, fd90, fd91;
mul.f64 fd93, fd83, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd94, fd77, 0dBFEF838B8C811C17, fd93;
mul.f64 fd95, fd62, 0d3FC63A1A7E0B738A;
mul.f64 fd96, fd68, 0dBFEF838B8C811C17;
sub.f64 fd97, fd95, fd96;
mul.f64 fd98, fd68, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd99, fd62, 0dBFEF838B8C811C17, fd98;
mul.f64 fd100, fd78, 0dBFEE11F642522D1C;
mul.f64 fd101, fd84, 0dBFD5E3A8748A0BF5;
sub.f64 fd102, fd100, fd101;
mul.f64 fd103, fd84, 0dBFEE11F642522D1C;
fma.rn.f64 fd104, fd78, 0dBFD5E3A8748A0BF5, fd103;
add.f64 fd105, fd54, fd70;
add.f64 fd106, fd56, fd72;
mul.f64 fd107, fd105, 0d3FE0000000000000;
sub.f64 fd108, fd38, fd107;
sub.f64 fd109, fd56, fd72;
mul.f64 fd110, fd109, 0d3FEBB67AE8584CAA;
add.f64 fd111, fd110, fd108;
sub.f64 fd112, fd108, fd110;
mul.f64 fd113, fd106, 0d3FE0000000000000;
sub.f64 fd114, fd40, fd113;
sub.f64 fd115, fd54, fd70;
mul.f64 fd116, fd115, 0d3FEBB67AE8584CAA;
sub.f64 fd117, fd114, fd116;
add.f64 fd118, fd116, fd114;
add.f64 fd119, fd87, fd92;
add.f64 fd120, fd45, fd119;
add.f64 fd121, fd89, fd94;
add.f64 fd122, fd51, fd121;
mul.f64 fd123, fd119, 0d3FE0000000000000;
sub.f64 fd124, fd45, fd123;
sub.f64 fd125, fd89, fd94;
mul.f64 fd126, fd125, 0d3FEBB67AE8584CAA;
add.f64 fd127, fd126, fd124;
sub.f64 fd128, fd124, fd126;
mul.f64 fd129, fd121, 0d3FE0000000000000;
sub.f64 fd130, fd51, fd129;
sub.f64 fd131, fd87, fd92;
mul.f64 fd132, fd131, 0d3FEBB67AE8584CAA;
sub.f64 fd133, fd130, fd132;
add.f64 fd134, fd132, fd130;
add.f64 fd135, fd97, fd102;
add.f64 fd136, fd46, fd135;
add.f64 fd137, fd99, fd104;
add.f64 fd138, fd52, fd137;
mul.f64 fd139, fd135, 0d3FE0000000000000;
sub.f64 fd140, fd46, fd139;
sub.f64 fd141, fd99, fd104;
mul.f64 fd142, fd141, 0d3FEBB67AE8584CAA;
add.f64 fd143, fd142, fd140;
sub.f64 fd144, fd140, fd142;
mul.f64 fd145, fd137, 0d3FE0000000000000;
sub.f64 fd146, fd52, fd145;
sub.f64 fd147, fd97, fd102;
mul.f64 fd148, fd147, 0d3FEBB67AE8584CAA;
sub.f64 fd149, fd146, fd148;
add.f64 fd150, fd148, fd146;
mul.wide.u32 rd2, r4, -901412889;
shr.u64 rd3, rd2, 38;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 81;
sub.s32 r7, r4, r6;
mad.lo.s32 r8, r5, 11664, r3;
mul.wide.u32 rd4, r7, 16;
mov.u64 rd5, %19;
add.s64 rd6, rd5, rd4;
ld.global.v2.f64 {fd151, fd152}, [rd6];
mul.f64 fd155, fd151, fd120;
mul.f64 fd156, fd152, fd122;
mul.f64 fd157, fd151, fd122;
mul.f64 fd158, fd151, fd151;
mul.f64 fd159, fd152, fd152;
sub.f64 fd160, fd158, fd159;
mul.f64 fd161, fd152, fd151;
fma.rn.f64 fd162, fd152, fd151, fd161;
mul.f64 fd163, fd160, fd136;
mul.f64 fd164, fd162, fd138;
mul.f64 fd165, fd160, fd138;
mul.f64 fd166, fd151, fd160;
mul.f64 fd167, fd152, fd162;
sub.f64 fd168, fd166, fd167;
mul.f64 fd169, fd151, fd162;
fma.rn.f64 fd170, fd152, fd160, fd169;
mul.f64 fd171, fd168, fd111;
mul.f64 fd172, fd170, fd117;
mul.f64 fd173, fd168, fd117;
mul.f64 fd174, fd151, fd168;
mul.f64 fd175, fd152, fd170;
sub.f64 fd176, fd174, fd175;
mul.f64 fd177, fd151, fd170;
fma.rn.f64 fd178, fd152, fd168, fd177;
mul.f64 fd179, fd176, fd127;
mul.f64 fd180, fd178, fd133;
mul.f64 fd181, fd176, fd133;
ld.global.v2.f64 {fd182, fd183}, [rd6+1296];
mul.f64 fd186, fd182, fd143;
mul.f64 fd187, fd183, fd149;
mul.f64 fd188, fd182, fd149;
mul.f64 fd189, fd151, fd182;
mul.f64 fd190, fd152, fd183;
sub.f64 fd191, fd189, fd190;
mul.f64 fd192, fd151, fd183;
fma.rn.f64 fd193, fd152, fd182, fd192;
mul.f64 fd194, fd191, fd112;
mul.f64 fd195, fd193, fd118;
mul.f64 fd196, fd191, fd118;
mul.f64 fd197, fd151, fd191;
mul.f64 fd198, fd152, fd193;
sub.f64 fd199, fd197, fd198;
mul.f64 fd200, fd151, fd193;
fma.rn.f64 fd201, fd152, fd191, fd200;
mul.f64 fd202, fd199, fd128;
mul.f64 fd203, fd201, fd134;
mul.f64 fd204, fd199, fd134;
mul.f64 fd205, fd151, fd199;
mul.f64 fd206, fd152, fd201;
sub.f64 fd207, fd205, fd206;
mul.f64 fd208, fd151, fd201;
fma.rn.f64 fd209, fd152, fd199, fd208;
mul.f64 fd210, fd207, fd144;
mul.f64 fd211, fd209, fd150;
mul.f64 fd212, fd207, fd150;
barrier.sync 0;
mad.lo.s32 r9, r7, 144, r8;
add.f64 fd213, fd40, fd106;
add.f64 fd214, fd38, fd105;
st.shared.v2.f64 [r9], {fd214, fd213};
fma.rn.f64 fd215, fd152, fd120, fd157;
sub.f64 fd216, fd155, fd156;
st.shared.v2.f64 [r9+16], {fd216, fd215};
fma.rn.f64 fd217, fd162, fd136, fd165;
sub.f64 fd218, fd163, fd164;
st.shared.v2.f64 [r9+32], {fd218, fd217};
sub.f64 fd219, fd171, fd172;
fma.rn.f64 fd220, fd170, fd111, fd173;
st.shared.v2.f64 [r9+48], {fd219, fd220};
fma.rn.f64 fd221, fd178, fd127, fd181;
sub.f64 fd222, fd179, fd180;
st.shared.v2.f64 [r9+64], {fd222, fd221};
fma.rn.f64 fd223, fd183, fd143, fd188;
sub.f64 fd224, fd186, fd187;
st.shared.v2.f64 [r9+80], {fd224, fd223};
fma.rn.f64 fd225, fd193, fd112, fd196;
sub.f64 fd226, fd194, fd195;
st.shared.v2.f64 [r9+96], {fd226, fd225};
fma.rn.f64 fd227, fd201, fd128, fd204;
sub.f64 fd228, fd202, fd203;
st.shared.v2.f64 [r9+112], {fd228, fd227};
fma.rn.f64 fd229, fd209, fd144, fd212;
sub.f64 fd230, fd210, fd211;
st.shared.v2.f64 [r9+128], {fd230, fd229};
barrier.sync 0;
shl.b32 r10, r7, 7;
sub.s32 r11, r9, r10;
ld.shared.v2.f64 {fd231, fd232}, [r11];
ld.shared.v2.f64 {fd235, fd236}, [r11+1296];
ld.shared.v2.f64 {fd239, fd240}, [r11+2592];
ld.shared.v2.f64 {fd243, fd244}, [r11+3888];
ld.shared.v2.f64 {fd247, fd248}, [r11+5184];
ld.shared.v2.f64 {fd251, fd252}, [r11+6480];
ld.shared.v2.f64 {fd255, fd256}, [r11+7776];
ld.shared.v2.f64 {fd259, fd260}, [r11+9072];
ld.shared.v2.f64 {fd263, fd264}, [r11+10368];
add.f64 fd267, fd243, fd255;
add.f64 fd268, fd231, fd267;
add.f64 fd269, fd244, fd256;
add.f64 fd270, fd232, fd269;
mul.f64 fd271, fd267, 0d3FE0000000000000;
sub.f64 fd272, fd231, fd271;
sub.f64 fd273, fd244, fd256;
mul.f64 fd274, fd273, 0d3FEBB67AE8584CAA;
add.f64 fd275, fd274, fd272;
sub.f64 fd276, fd272, fd274;
mul.f64 fd277, fd269, 0d3FE0000000000000;
sub.f64 fd278, fd232, fd277;
sub.f64 fd279, fd243, fd255;
mul.f64 fd280, fd279, 0d3FEBB67AE8584CAA;
sub.f64 fd281, fd278, fd280;
add.f64 fd282, fd280, fd278;
add.f64 fd283, fd247, fd259;
add.f64 fd284, fd235, fd283;
add.f64 fd285, fd248, fd260;
add.f64 fd286, fd236, fd285;
mul.f64 fd287, fd283, 0d3FE0000000000000;
sub.f64 fd288, fd235, fd287;
sub.f64 fd289, fd248, fd260;
mul.f64 fd290, fd289, 0d3FEBB67AE8584CAA;
add.f64 fd291, fd290, fd288;
sub.f64 fd292, fd288, fd290;
mul.f64 fd293, fd285, 0d3FE0000000000000;
sub.f64 fd294, fd236, fd293;
sub.f64 fd295, fd247, fd259;
mul.f64 fd296, fd295, 0d3FEBB67AE8584CAA;
sub.f64 fd297, fd294, fd296;
add.f64 fd298, fd296, fd294;
add.f64 fd299, fd251, fd263;
add.f64 fd300, fd239, fd299;
add.f64 fd301, fd252, fd264;
add.f64 fd302, fd240, fd301;
mul.f64 fd303, fd299, 0d3FE0000000000000;
sub.f64 fd304, fd239, fd303;
sub.f64 fd305, fd252, fd264;
mul.f64 fd306, fd305, 0d3FEBB67AE8584CAA;
add.f64 fd307, fd306, fd304;
sub.f64 fd308, fd304, fd306;
mul.f64 fd309, fd301, 0d3FE0000000000000;
sub.f64 fd310, fd240, fd309;
sub.f64 fd311, fd251, fd263;
mul.f64 fd312, fd311, 0d3FEBB67AE8584CAA;
sub.f64 fd313, fd310, fd312;
add.f64 fd314, fd312, fd310;
mul.f64 fd315, fd291, 0d3FE8836FA2CF5039;
mul.f64 fd316, fd297, 0dBFE491B7523C161D;
sub.f64 fd317, fd315, fd316;
mul.f64 fd318, fd297, 0d3FE8836FA2CF5039;
fma.rn.f64 fd319, fd291, 0dBFE491B7523C161D, fd318;
mul.f64 fd320, fd307, 0d3FC63A1A7E0B738A;
mul.f64 fd321, fd313, 0dBFEF838B8C811C17;
sub.f64 fd322, fd320, fd321;
mul.f64 fd323, fd313, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd324, fd307, 0dBFEF838B8C811C17, fd323;
mul.f64 fd325, fd292, 0d3FC63A1A7E0B738A;
mul.f64 fd326, fd298, 0dBFEF838B8C811C17;
sub.f64 fd327, fd325, fd326;
mul.f64 fd328, fd298, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd329, fd292, 0dBFEF838B8C811C17, fd328;
mul.f64 fd330, fd308, 0dBFEE11F642522D1C;
mul.f64 fd331, fd314, 0dBFD5E3A8748A0BF5;
sub.f64 fd332, fd330, fd331;
mul.f64 fd333, fd314, 0dBFEE11F642522D1C;
fma.rn.f64 fd334, fd308, 0dBFD5E3A8748A0BF5, fd333;
add.f64 fd335, fd284, fd300;
add.f64 fd336, fd286, fd302;
mul.f64 fd337, fd335, 0d3FE0000000000000;
sub.f64 fd338, fd268, fd337;
sub.f64 fd339, fd286, fd302;
mul.f64 fd340, fd339, 0d3FEBB67AE8584CAA;
add.f64 fd341, fd340, fd338;
sub.f64 fd342, fd338, fd340;
mul.f64 fd343, fd336, 0d3FE0000000000000;
sub.f64 fd344, fd270, fd343;
sub.f64 fd345, fd284, fd300;
mul.f64 fd346, fd345, 0d3FEBB67AE8584CAA;
sub.f64 fd347, fd344, fd346;
add.f64 fd348, fd346, fd344;
add.f64 fd349, fd317, fd322;
add.f64 fd350, fd275, fd349;
add.f64 fd351, fd319, fd324;
add.f64 fd352, fd281, fd351;
mul.f64 fd353, fd349, 0d3FE0000000000000;
sub.f64 fd354, fd275, fd353;
sub.f64 fd355, fd319, fd324;
mul.f64 fd356, fd355, 0d3FEBB67AE8584CAA;
add.f64 fd357, fd356, fd354;
sub.f64 fd358, fd354, fd356;
mul.f64 fd359, fd351, 0d3FE0000000000000;
sub.f64 fd360, fd281, fd359;
sub.f64 fd361, fd317, fd322;
mul.f64 fd362, fd361, 0d3FEBB67AE8584CAA;
sub.f64 fd363, fd360, fd362;
add.f64 fd364, fd362, fd360;
add.f64 fd365, fd327, fd332;
add.f64 fd366, fd276, fd365;
add.f64 fd367, fd329, fd334;
add.f64 fd368, fd282, fd367;
mul.f64 fd369, fd365, 0d3FE0000000000000;
sub.f64 fd370, fd276, fd369;
sub.f64 fd371, fd329, fd334;
mul.f64 fd372, fd371, 0d3FEBB67AE8584CAA;
add.f64 fd373, fd372, fd370;
sub.f64 fd374, fd370, fd372;
mul.f64 fd375, fd367, 0d3FE0000000000000;
sub.f64 fd376, fd282, fd375;
sub.f64 fd377, fd327, fd332;
mul.f64 fd378, fd377, 0d3FEBB67AE8584CAA;
sub.f64 fd379, fd376, fd378;
add.f64 fd380, fd378, fd376;
mul.wide.u32 rd7, r7, 954437177;
shr.u64 rd8, rd7, 33;
cvt.u32.u64 r12, rd8;
mul.lo.s32 r13, r12, 9;
sub.s32 r14, r7, r13;
mul.wide.u32 rd9, r12, 16;
mov.u64 rd10, %20;
add.s64 rd11, rd10, rd9;
ld.global.v2.f64 {fd381, fd382}, [rd11];
mul.f64 fd385, fd381, fd350;
mul.f64 fd386, fd382, fd352;
mul.f64 fd387, fd381, fd352;
mul.f64 fd388, fd381, fd381;
mul.f64 fd389, fd382, fd382;
sub.f64 fd390, fd388, fd389;
mul.f64 fd391, fd382, fd381;
fma.rn.f64 fd392, fd382, fd381, fd391;
mul.f64 fd393, fd390, fd366;
mul.f64 fd394, fd392, fd368;
mul.f64 fd395, fd390, fd368;
mul.f64 fd396, fd381, fd390;
mul.f64 fd397, fd382, fd392;
sub.f64 fd398, fd396, fd397;
mul.f64 fd399, fd381, fd392;
fma.rn.f64 fd400, fd382, fd390, fd399;
mul.f64 fd401, fd398, fd341;
mul.f64 fd402, fd400, fd347;
mul.f64 fd403, fd398, fd347;
mul.f64 fd404, fd381, fd398;
mul.f64 fd405, fd382, fd400;
sub.f64 fd406, fd404, fd405;
mul.f64 fd407, fd381, fd400;
fma.rn.f64 fd408, fd382, fd398, fd407;
mul.f64 fd409, fd406, fd357;
mul.f64 fd410, fd408, fd363;
mul.f64 fd411, fd406, fd363;
ld.global.v2.f64 {fd412, fd413}, [rd11+144];
mul.f64 fd416, fd412, fd373;
mul.f64 fd417, fd413, fd379;
mul.f64 fd418, fd412, fd379;
mul.f64 fd419, fd381, fd412;
mul.f64 fd420, fd382, fd413;
sub.f64 fd421, fd419, fd420;
mul.f64 fd422, fd381, fd413;
fma.rn.f64 fd423, fd382, fd412, fd422;
mul.f64 fd424, fd421, fd342;
mul.f64 fd425, fd423, fd348;
mul.f64 fd426, fd421, fd348;
mul.f64 fd427, fd381, fd421;
mul.f64 fd428, fd382, fd423;
sub.f64 fd429, fd427, fd428;
mul.f64 fd430, fd381, fd423;
fma.rn.f64 fd431, fd382, fd421, fd430;
mul.f64 fd432, fd429, fd358;
mul.f64 fd433, fd431, fd364;
mul.f64 fd434, fd429, fd364;
mul.f64 fd435, fd381, fd429;
mul.f64 fd436, fd382, fd431;
sub.f64 fd437, fd435, fd436;
mul.f64 fd438, fd381, fd431;
fma.rn.f64 fd439, fd382, fd429, fd438;
mul.f64 fd440, fd437, fd374;
mul.f64 fd441, fd439, fd380;
mul.f64 fd442, fd437, fd380;
shl.b32 r15, r14, 4;
add.s32 r16, r8, r15;
barrier.sync 0;
mad.lo.s32 r17, r12, 1296, r16;
add.f64 fd443, fd270, fd336;
add.f64 fd444, fd268, fd335;
st.shared.v2.f64 [r17], {fd444, fd443};
fma.rn.f64 fd445, fd382, fd350, fd387;
sub.f64 fd446, fd385, fd386;
st.shared.v2.f64 [r17+144], {fd446, fd445};
fma.rn.f64 fd447, fd392, fd366, fd395;
sub.f64 fd448, fd393, fd394;
st.shared.v2.f64 [r17+288], {fd448, fd447};
fma.rn.f64 fd449, fd400, fd341, fd403;
sub.f64 fd450, fd401, fd402;
st.shared.v2.f64 [r17+432], {fd450, fd449};
fma.rn.f64 fd451, fd408, fd357, fd411;
sub.f64 fd452, fd409, fd410;
st.shared.v2.f64 [r17+576], {fd452, fd451};
fma.rn.f64 fd453, fd413, fd373, fd418;
sub.f64 fd454, fd416, fd417;
st.shared.v2.f64 [r17+720], {fd454, fd453};
fma.rn.f64 fd455, fd423, fd342, fd426;
sub.f64 fd456, fd424, fd425;
st.shared.v2.f64 [r17+864], {fd456, fd455};
fma.rn.f64 fd457, fd431, fd358, fd434;
sub.f64 fd458, fd432, fd433;
st.shared.v2.f64 [r17+1008], {fd458, fd457};
fma.rn.f64 fd459, fd439, fd374, fd442;
sub.f64 fd460, fd440, fd441;
st.shared.v2.f64 [r17+1152], {fd460, fd459};
barrier.sync 0;
ld.shared.v2.f64 {fd461, fd462}, [r11];
ld.shared.v2.f64 {fd465, fd466}, [r11+1296];
ld.shared.v2.f64 {fd469, fd470}, [r11+2592];
ld.shared.v2.f64 {fd473, fd474}, [r11+3888];
ld.shared.v2.f64 {fd477, fd478}, [r11+5184];
ld.shared.v2.f64 {fd481, fd482}, [r11+6480];
ld.shared.v2.f64 {fd485, fd486}, [r11+7776];
ld.shared.v2.f64 {fd489, fd490}, [r11+9072];
ld.shared.v2.f64 {fd493, fd494}, [r11+10368];
add.f64 fd497, fd473, fd485;
add.f64 fd498, fd461, fd497;
add.f64 fd499, fd474, fd486;
add.f64 fd500, fd462, fd499;
mul.f64 fd501, fd497, 0d3FE0000000000000;
sub.f64 fd502, fd461, fd501;
sub.f64 fd503, fd474, fd486;
mul.f64 fd504, fd503, 0d3FEBB67AE8584CAA;
add.f64 fd505, fd504, fd502;
sub.f64 fd506, fd502, fd504;
mul.f64 fd507, fd499, 0d3FE0000000000000;
sub.f64 fd508, fd462, fd507;
sub.f64 fd509, fd473, fd485;
mul.f64 fd510, fd509, 0d3FEBB67AE8584CAA;
sub.f64 fd511, fd508, fd510;
add.f64 fd512, fd510, fd508;
add.f64 fd513, fd477, fd489;
add.f64 fd514, fd465, fd513;
add.f64 fd515, fd478, fd490;
add.f64 fd516, fd466, fd515;
mul.f64 fd517, fd513, 0d3FE0000000000000;
sub.f64 fd518, fd465, fd517;
sub.f64 fd519, fd478, fd490;
mul.f64 fd520, fd519, 0d3FEBB67AE8584CAA;
add.f64 fd521, fd520, fd518;
sub.f64 fd522, fd518, fd520;
mul.f64 fd523, fd515, 0d3FE0000000000000;
sub.f64 fd524, fd466, fd523;
sub.f64 fd525, fd477, fd489;
mul.f64 fd526, fd525, 0d3FEBB67AE8584CAA;
sub.f64 fd527, fd524, fd526;
add.f64 fd528, fd526, fd524;
add.f64 fd529, fd481, fd493;
add.f64 fd530, fd469, fd529;
add.f64 fd531, fd482, fd494;
add.f64 fd532, fd470, fd531;
mul.f64 fd533, fd529, 0d3FE0000000000000;
sub.f64 fd534, fd469, fd533;
sub.f64 fd535, fd482, fd494;
mul.f64 fd536, fd535, 0d3FEBB67AE8584CAA;
add.f64 fd537, fd536, fd534;
sub.f64 fd538, fd534, fd536;
mul.f64 fd539, fd531, 0d3FE0000000000000;
sub.f64 fd540, fd470, fd539;
sub.f64 fd541, fd481, fd493;
mul.f64 fd542, fd541, 0d3FEBB67AE8584CAA;
sub.f64 fd543, fd540, fd542;
add.f64 fd544, fd542, fd540;
mul.f64 fd545, fd521, 0d3FE8836FA2CF5039;
mul.f64 fd546, fd527, 0dBFE491B7523C161D;
sub.f64 fd547, fd545, fd546;
mul.f64 fd548, fd527, 0d3FE8836FA2CF5039;
fma.rn.f64 fd549, fd521, 0dBFE491B7523C161D, fd548;
mul.f64 fd550, fd537, 0d3FC63A1A7E0B738A;
mul.f64 fd551, fd543, 0dBFEF838B8C811C17;
sub.f64 fd552, fd550, fd551;
mul.f64 fd553, fd543, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd554, fd537, 0dBFEF838B8C811C17, fd553;
mul.f64 fd555, fd522, 0d3FC63A1A7E0B738A;
mul.f64 fd556, fd528, 0dBFEF838B8C811C17;
sub.f64 fd557, fd555, fd556;
mul.f64 fd558, fd528, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd559, fd522, 0dBFEF838B8C811C17, fd558;
mul.f64 fd560, fd538, 0dBFEE11F642522D1C;
mul.f64 fd561, fd544, 0dBFD5E3A8748A0BF5;
sub.f64 fd562, fd560, fd561;
mul.f64 fd563, fd544, 0dBFEE11F642522D1C;
fma.rn.f64 fd564, fd538, 0dBFD5E3A8748A0BF5, fd563;
add.f64 fd565, fd514, fd530;
add.f64 fd566, fd516, fd532;
mul.f64 fd567, fd565, 0d3FE0000000000000;
sub.f64 fd568, fd498, fd567;
sub.f64 fd569, fd516, fd532;
mul.f64 fd570, fd569, 0d3FEBB67AE8584CAA;
mul.f64 fd571, fd566, 0d3FE0000000000000;
sub.f64 fd572, fd500, fd571;
sub.f64 fd573, fd514, fd530;
mul.f64 fd574, fd573, 0d3FEBB67AE8584CAA;
add.f64 fd575, fd547, fd552;
add.f64 fd576, fd549, fd554;
mul.f64 fd577, fd575, 0d3FE0000000000000;
sub.f64 fd578, fd505, fd577;
sub.f64 fd579, fd549, fd554;
mul.f64 fd580, fd579, 0d3FEBB67AE8584CAA;
mul.f64 fd581, fd576, 0d3FE0000000000000;
sub.f64 fd582, fd511, fd581;
sub.f64 fd583, fd547, fd552;
mul.f64 fd584, fd583, 0d3FEBB67AE8584CAA;
add.f64 fd585, fd557, fd562;
add.f64 fd586, fd559, fd564;
mul.f64 fd587, fd585, 0d3FE0000000000000;
sub.f64 fd588, fd506, fd587;
sub.f64 fd589, fd559, fd564;
mul.f64 fd590, fd589, 0d3FEBB67AE8584CAA;
mul.f64 fd591, fd586, 0d3FE0000000000000;
sub.f64 fd592, fd512, fd591;
sub.f64 fd593, fd557, fd562;
mul.f64 fd594, fd593, 0d3FEBB67AE8584CAA;
add.f64 %1, fd500, fd566;
add.f64 %0, fd498, fd565;
add.f64 %3, fd511, fd576;
add.f64 %2, fd505, fd575;
add.f64 %5, fd512, fd586;
add.f64 %4, fd506, fd585;
sub.f64 %7, fd572, fd574;
add.f64 %6, fd570, fd568;
sub.f64 %9, fd582, fd584;
add.f64 %8, fd580, fd578;
sub.f64 %11, fd592, fd594;
add.f64 %10, fd590, fd588;
add.f64 %13, fd574, fd572;
sub.f64 %12, fd568, fd570;
add.f64 %15, fd584, fd582;
sub.f64 %14, fd578, fd580;
add.f64 %17, fd594, fd592;
sub.f64 %16, fd588, fd590;
})"
     // Operand map for the constraint list that follows.
     //   Outputs %0..%17 : rmem[k].x -> %(2k), rmem[k].y -> %(2k+1), k = 0..8.
     //   Inputs  %18 = smem, %19 = lut_dp_9_729, %20 = lut_dp_9_81,
     //           %21..%43 = rmem[0..8] components in the order listed.
     // The .y components of rmem[1], [2], [4], [5] and [7] are each listed
     // twice. The PTX above references only the second copy of each
     // (%25, %28, %33, %36, %41); %24, %27, %32, %35 and %40 are never used.
     // Every later operand index depends on those slots, so they must stay.
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y), "=d"(rmem[5].x), "=d"(rmem[5].y), "=d"(rmem[6].x), "=d"(rmem[6].y), "=d"(rmem[7].x), "=d"(rmem[7].y), "=d"(rmem[8].x), "=d"(rmem[8].y): "r"(smem), "l"(lut_dp_9_729), "l"(lut_dp_9_81), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y), "d"(rmem[4].y), "d"(rmem[5].x), "d"(rmem[5].y), "d"(rmem[5].y), "d"(rmem[6].x), "d"(rmem[6].y), "d"(rmem[7].x), "d"(rmem[7].y), "d"(rmem[7].y), "d"(rmem[8].x), "d"(rmem[8].y));
};




// Specialization <522, double, 1> of cufftdx_private_function: a generated,
// single-statement inline-PTX routine. The include guard of this header places
// it in the 729-point FP64 forward set; what template id 522 selects is decided
// outside this block.
//
// Parameters
//   rmem  Per-thread array of complex<double>. Elements 0..8 are read as
//         inputs, and both components of elements 0..8 are overwritten with
//         the results (asm operands %0..%17).
//   smem  32-bit shared-memory address (operand %18) used as the base of the
//         exchange buffer. The routine works on the region that starts at
//         smem + (tid.y + tid.x / 81) * 5832 bytes and touches 5832 bytes
//         (729 doubles) of it.
//
// What the asm body does, in order (t = tid.x % 81)
//   1. Combines the nine complex inputs with two layers of three-input
//      add/subtract stages (constants 0.5 and 0d3FEBB67AE8584CAA ~ 0.8660254).
//      Between the layers some values are multiplied by fixed complex
//      constants (~0.766-0.643i, ~0.174-0.985i, ~-0.940-0.342i).
//   2. Loads a complex value w from lut_dp_9_729[t] and a second entry 81
//      elements further on (byte offset 1296). Output 0 is left unscaled,
//      outputs 1..4 are multiplied by w, w*w, ... built by repeated
//      multiplication, and outputs 5..8 by the second entry times successive
//      powers of w.
//   3. Exchanges the values with other threads through shared memory. Each
//      thread stores 9 consecutive doubles at element 9 * t and reloads 9
//      doubles starting at element t with a stride of 81 doubles. The real
//      parts make this round trip first; the imaginary parts then reuse the
//      same addresses.
//   4. Repeats steps 1-3 with lut_dp_9_81, indexed by t / 9 with the second
//      entry 9 elements further on (byte offset 144). Stores start at element
//      81 * (t / 9) + t % 9 with a stride of 9 doubles; reloads are as in
//      step 3.
//   5. Runs the step-1 combination once more and writes the 18 results to
//      rmem[0..8].
//
// Synchronization
//   The body executes `barrier.sync 0` eight times, unconditionally.
//   NOTE(review): this presumably requires every thread of the block to call
//   the routine under uniform control flow - confirm against the callers.
//
// Operand numbering
//   %18 = smem, %19 = lut_dp_9_729, %20 = lut_dp_9_81, %21..%43 = inputs.
//   The input list names rmem[1].y, rmem[2].y, rmem[4].y, rmem[5].y and
//   rmem[7].y twice. The PTX text references only the second copy of each
//   (%25, %28, %33, %36, %41); %24, %27, %32, %35 and %40 are never used.
//   Removing the duplicates would shift every later operand number, so the
//   list must not be "cleaned up" without renumbering the PTX.
template<> __forceinline__ __device__ void cufftdx_private_function<522, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

asm volatile (R"({
.reg .b32 r<18>;
.reg .f64 fd<577>;
.reg .b64 rd<12>;
mov.u32 r1, %tid.y;
mov.u32 r2, %18;
mad.lo.s32 r3, r1, 5832, r2;
add.f64 fd37, %29, %37;
add.f64 fd38, %21, fd37;
add.f64 fd39, %30, %38;
add.f64 fd40, %22, fd39;
mul.f64 fd41, fd37, 0d3FE0000000000000;
sub.f64 fd42, %21, fd41;
sub.f64 fd43, %30, %38;
mul.f64 fd44, fd43, 0d3FEBB67AE8584CAA;
add.f64 fd45, fd44, fd42;
sub.f64 fd46, fd42, fd44;
mul.f64 fd47, fd39, 0d3FE0000000000000;
sub.f64 fd48, %22, fd47;
sub.f64 fd49, %29, %37;
mul.f64 fd50, fd49, 0d3FEBB67AE8584CAA;
sub.f64 fd51, fd48, fd50;
add.f64 fd52, fd50, fd48;
add.f64 fd53, %31, %39;
add.f64 fd54, %23, fd53;
add.f64 fd55, %33, %41;
add.f64 fd56, %25, fd55;
mul.f64 fd57, fd53, 0d3FE0000000000000;
sub.f64 fd58, %23, fd57;
sub.f64 fd59, %33, %41;
mul.f64 fd60, fd59, 0d3FEBB67AE8584CAA;
add.f64 fd61, fd60, fd58;
sub.f64 fd62, fd58, fd60;
mul.f64 fd63, fd55, 0d3FE0000000000000;
sub.f64 fd64, %25, fd63;
sub.f64 fd65, %31, %39;
mul.f64 fd66, fd65, 0d3FEBB67AE8584CAA;
sub.f64 fd67, fd64, fd66;
add.f64 fd68, fd66, fd64;
add.f64 fd69, %34, %42;
add.f64 fd70, %26, fd69;
add.f64 fd71, %36, %43;
add.f64 fd72, %28, fd71;
mul.f64 fd73, fd69, 0d3FE0000000000000;
sub.f64 fd74, %26, fd73;
sub.f64 fd75, %36, %43;
mul.f64 fd76, fd75, 0d3FEBB67AE8584CAA;
add.f64 fd77, fd76, fd74;
sub.f64 fd78, fd74, fd76;
mul.f64 fd79, fd71, 0d3FE0000000000000;
sub.f64 fd80, %28, fd79;
sub.f64 fd81, %34, %42;
mul.f64 fd82, fd81, 0d3FEBB67AE8584CAA;
sub.f64 fd83, fd80, fd82;
add.f64 fd84, fd82, fd80;
mov.u32 r4, %tid.x;
mul.f64 fd85, fd61, 0d3FE8836FA2CF5039;
mul.f64 fd86, fd67, 0dBFE491B7523C161D;
sub.f64 fd87, fd85, fd86;
mul.f64 fd88, fd67, 0d3FE8836FA2CF5039;
fma.rn.f64 fd89, fd61, 0dBFE491B7523C161D, fd88;
mul.f64 fd90, fd77, 0d3FC63A1A7E0B738A;
mul.f64 fd91, fd83, 0dBFEF838B8C811C17;
sub.f64 fd92, fd90, fd91;
mul.f64 fd93, fd83, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd94, fd77, 0dBFEF838B8C811C17, fd93;
mul.f64 fd95, fd62, 0d3FC63A1A7E0B738A;
mul.f64 fd96, fd68, 0dBFEF838B8C811C17;
sub.f64 fd97, fd95, fd96;
mul.f64 fd98, fd68, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd99, fd62, 0dBFEF838B8C811C17, fd98;
mul.f64 fd100, fd78, 0dBFEE11F642522D1C;
mul.f64 fd101, fd84, 0dBFD5E3A8748A0BF5;
sub.f64 fd102, fd100, fd101;
mul.f64 fd103, fd84, 0dBFEE11F642522D1C;
fma.rn.f64 fd104, fd78, 0dBFD5E3A8748A0BF5, fd103;
add.f64 fd105, fd54, fd70;
add.f64 fd106, fd38, fd105;
add.f64 fd107, fd56, fd72;
add.f64 fd108, fd40, fd107;
mul.f64 fd109, fd105, 0d3FE0000000000000;
sub.f64 fd110, fd38, fd109;
sub.f64 fd111, fd56, fd72;
mul.f64 fd112, fd111, 0d3FEBB67AE8584CAA;
add.f64 fd113, fd112, fd110;
sub.f64 fd114, fd110, fd112;
mul.f64 fd115, fd107, 0d3FE0000000000000;
sub.f64 fd116, fd40, fd115;
sub.f64 fd117, fd54, fd70;
mul.f64 fd118, fd117, 0d3FEBB67AE8584CAA;
sub.f64 fd119, fd116, fd118;
add.f64 fd120, fd118, fd116;
add.f64 fd121, fd87, fd92;
add.f64 fd122, fd45, fd121;
add.f64 fd123, fd89, fd94;
add.f64 fd124, fd51, fd123;
mul.f64 fd125, fd121, 0d3FE0000000000000;
sub.f64 fd126, fd45, fd125;
sub.f64 fd127, fd89, fd94;
mul.f64 fd128, fd127, 0d3FEBB67AE8584CAA;
add.f64 fd129, fd128, fd126;
sub.f64 fd130, fd126, fd128;
mul.f64 fd131, fd123, 0d3FE0000000000000;
sub.f64 fd132, fd51, fd131;
sub.f64 fd133, fd87, fd92;
mul.f64 fd134, fd133, 0d3FEBB67AE8584CAA;
sub.f64 fd135, fd132, fd134;
add.f64 fd136, fd134, fd132;
add.f64 fd137, fd97, fd102;
add.f64 fd138, fd46, fd137;
add.f64 fd139, fd99, fd104;
add.f64 fd140, fd52, fd139;
mul.f64 fd141, fd137, 0d3FE0000000000000;
sub.f64 fd142, fd46, fd141;
sub.f64 fd143, fd99, fd104;
mul.f64 fd144, fd143, 0d3FEBB67AE8584CAA;
add.f64 fd145, fd144, fd142;
sub.f64 fd146, fd142, fd144;
mul.f64 fd147, fd139, 0d3FE0000000000000;
sub.f64 fd148, fd52, fd147;
sub.f64 fd149, fd97, fd102;
mul.f64 fd150, fd149, 0d3FEBB67AE8584CAA;
sub.f64 fd151, fd148, fd150;
add.f64 fd152, fd150, fd148;
mul.wide.u32 rd2, r4, -901412889;
shr.u64 rd3, rd2, 38;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 81;
sub.s32 r7, r4, r6;
mul.wide.u32 rd4, r7, 16;
mov.u64 rd5, %19;
add.s64 rd6, rd5, rd4;
ld.global.v2.f64 {fd153, fd154}, [rd6];
mul.f64 fd157, fd153, fd122;
mul.f64 fd158, fd154, fd124;
sub.f64 fd159, fd157, fd158;
mul.f64 fd160, fd153, fd124;
fma.rn.f64 fd161, fd154, fd122, fd160;
mul.f64 fd162, fd153, fd153;
mul.f64 fd163, fd154, fd154;
sub.f64 fd164, fd162, fd163;
mul.f64 fd165, fd154, fd153;
fma.rn.f64 fd166, fd154, fd153, fd165;
mul.f64 fd167, fd164, fd138;
mul.f64 fd168, fd166, fd140;
sub.f64 fd169, fd167, fd168;
mul.f64 fd170, fd164, fd140;
fma.rn.f64 fd171, fd166, fd138, fd170;
mul.f64 fd172, fd153, fd164;
mul.f64 fd173, fd154, fd166;
sub.f64 fd174, fd172, fd173;
mul.f64 fd175, fd153, fd166;
fma.rn.f64 fd176, fd154, fd164, fd175;
mul.f64 fd177, fd174, fd113;
mul.f64 fd178, fd176, fd119;
sub.f64 fd179, fd177, fd178;
mul.f64 fd180, fd174, fd119;
fma.rn.f64 fd181, fd176, fd113, fd180;
mul.f64 fd182, fd153, fd174;
mul.f64 fd183, fd154, fd176;
sub.f64 fd184, fd182, fd183;
mul.f64 fd185, fd153, fd176;
fma.rn.f64 fd186, fd154, fd174, fd185;
mul.f64 fd187, fd184, fd129;
mul.f64 fd188, fd186, fd135;
sub.f64 fd189, fd187, fd188;
mul.f64 fd190, fd184, fd135;
fma.rn.f64 fd191, fd186, fd129, fd190;
ld.global.v2.f64 {fd192, fd193}, [rd6+1296];
mul.f64 fd196, fd192, fd145;
mul.f64 fd197, fd193, fd151;
sub.f64 fd198, fd196, fd197;
mul.f64 fd199, fd192, fd151;
fma.rn.f64 fd200, fd193, fd145, fd199;
mul.f64 fd201, fd153, fd192;
mul.f64 fd202, fd154, fd193;
sub.f64 fd203, fd201, fd202;
mul.f64 fd204, fd153, fd193;
fma.rn.f64 fd205, fd154, fd192, fd204;
mul.f64 fd206, fd203, fd114;
mul.f64 fd207, fd205, fd120;
sub.f64 fd208, fd206, fd207;
mul.f64 fd209, fd203, fd120;
fma.rn.f64 fd210, fd205, fd114, fd209;
mul.f64 fd211, fd153, fd203;
mul.f64 fd212, fd154, fd205;
sub.f64 fd213, fd211, fd212;
mul.f64 fd214, fd153, fd205;
fma.rn.f64 fd215, fd154, fd203, fd214;
mul.f64 fd216, fd213, fd130;
mul.f64 fd217, fd215, fd136;
sub.f64 fd218, fd216, fd217;
mul.f64 fd219, fd213, fd136;
fma.rn.f64 fd220, fd215, fd130, fd219;
mul.f64 fd221, fd153, fd213;
mul.f64 fd222, fd154, fd215;
sub.f64 fd223, fd221, fd222;
mul.f64 fd224, fd153, fd215;
fma.rn.f64 fd225, fd154, fd213, fd224;
mul.f64 fd226, fd223, fd146;
mul.f64 fd227, fd225, fd152;
sub.f64 fd228, fd226, fd227;
mul.f64 fd229, fd223, fd152;
fma.rn.f64 fd230, fd225, fd146, fd229;
mad.lo.s32 r8, r5, 5832, r3;
barrier.sync 0;
mad.lo.s32 r9, r7, 72, r8;
st.shared.f64 [r9], fd106;
st.shared.f64 [r9+8], fd159;
st.shared.f64 [r9+16], fd169;
st.shared.f64 [r9+24], fd179;
st.shared.f64 [r9+32], fd189;
st.shared.f64 [r9+40], fd198;
st.shared.f64 [r9+48], fd208;
st.shared.f64 [r9+56], fd218;
st.shared.f64 [r9+64], fd228;
barrier.sync 0;
shl.b32 r10, r7, 6;
sub.s32 r11, r9, r10;
ld.shared.f64 fd231, [r11];
ld.shared.f64 fd232, [r11+648];
ld.shared.f64 fd233, [r11+1296];
ld.shared.f64 fd234, [r11+1944];
ld.shared.f64 fd235, [r11+2592];
ld.shared.f64 fd236, [r11+3240];
ld.shared.f64 fd237, [r11+3888];
ld.shared.f64 fd238, [r11+4536];
ld.shared.f64 fd239, [r11+5184];
barrier.sync 0;
st.shared.f64 [r9], fd108;
st.shared.f64 [r9+8], fd161;
st.shared.f64 [r9+16], fd171;
st.shared.f64 [r9+24], fd181;
st.shared.f64 [r9+32], fd191;
st.shared.f64 [r9+40], fd200;
st.shared.f64 [r9+48], fd210;
st.shared.f64 [r9+56], fd220;
st.shared.f64 [r9+64], fd230;
barrier.sync 0;
ld.shared.f64 fd240, [r11];
ld.shared.f64 fd241, [r11+648];
ld.shared.f64 fd242, [r11+1296];
ld.shared.f64 fd243, [r11+1944];
ld.shared.f64 fd244, [r11+2592];
ld.shared.f64 fd245, [r11+3240];
ld.shared.f64 fd246, [r11+3888];
ld.shared.f64 fd247, [r11+4536];
ld.shared.f64 fd248, [r11+5184];
add.f64 fd249, fd234, fd237;
add.f64 fd250, fd231, fd249;
add.f64 fd251, fd243, fd246;
add.f64 fd252, fd240, fd251;
mul.f64 fd253, fd249, 0d3FE0000000000000;
sub.f64 fd254, fd231, fd253;
sub.f64 fd255, fd243, fd246;
mul.f64 fd256, fd255, 0d3FEBB67AE8584CAA;
add.f64 fd257, fd256, fd254;
sub.f64 fd258, fd254, fd256;
mul.f64 fd259, fd251, 0d3FE0000000000000;
sub.f64 fd260, fd240, fd259;
sub.f64 fd261, fd234, fd237;
mul.f64 fd262, fd261, 0d3FEBB67AE8584CAA;
sub.f64 fd263, fd260, fd262;
add.f64 fd264, fd262, fd260;
add.f64 fd265, fd235, fd238;
add.f64 fd266, fd232, fd265;
add.f64 fd267, fd244, fd247;
add.f64 fd268, fd241, fd267;
mul.f64 fd269, fd265, 0d3FE0000000000000;
sub.f64 fd270, fd232, fd269;
sub.f64 fd271, fd244, fd247;
mul.f64 fd272, fd271, 0d3FEBB67AE8584CAA;
add.f64 fd273, fd272, fd270;
sub.f64 fd274, fd270, fd272;
mul.f64 fd275, fd267, 0d3FE0000000000000;
sub.f64 fd276, fd241, fd275;
sub.f64 fd277, fd235, fd238;
mul.f64 fd278, fd277, 0d3FEBB67AE8584CAA;
sub.f64 fd279, fd276, fd278;
add.f64 fd280, fd278, fd276;
add.f64 fd281, fd236, fd239;
add.f64 fd282, fd233, fd281;
add.f64 fd283, fd245, fd248;
add.f64 fd284, fd242, fd283;
mul.f64 fd285, fd281, 0d3FE0000000000000;
sub.f64 fd286, fd233, fd285;
sub.f64 fd287, fd245, fd248;
mul.f64 fd288, fd287, 0d3FEBB67AE8584CAA;
add.f64 fd289, fd288, fd286;
sub.f64 fd290, fd286, fd288;
mul.f64 fd291, fd283, 0d3FE0000000000000;
sub.f64 fd292, fd242, fd291;
sub.f64 fd293, fd236, fd239;
mul.f64 fd294, fd293, 0d3FEBB67AE8584CAA;
sub.f64 fd295, fd292, fd294;
add.f64 fd296, fd294, fd292;
mul.f64 fd297, fd273, 0d3FE8836FA2CF5039;
mul.f64 fd298, fd279, 0dBFE491B7523C161D;
sub.f64 fd299, fd297, fd298;
mul.f64 fd300, fd279, 0d3FE8836FA2CF5039;
fma.rn.f64 fd301, fd273, 0dBFE491B7523C161D, fd300;
mul.f64 fd302, fd289, 0d3FC63A1A7E0B738A;
mul.f64 fd303, fd295, 0dBFEF838B8C811C17;
sub.f64 fd304, fd302, fd303;
mul.f64 fd305, fd295, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd306, fd289, 0dBFEF838B8C811C17, fd305;
mul.f64 fd307, fd274, 0d3FC63A1A7E0B738A;
mul.f64 fd308, fd280, 0dBFEF838B8C811C17;
sub.f64 fd309, fd307, fd308;
mul.f64 fd310, fd280, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd311, fd274, 0dBFEF838B8C811C17, fd310;
mul.f64 fd312, fd290, 0dBFEE11F642522D1C;
mul.f64 fd313, fd296, 0dBFD5E3A8748A0BF5;
sub.f64 fd314, fd312, fd313;
mul.f64 fd315, fd296, 0dBFEE11F642522D1C;
fma.rn.f64 fd316, fd290, 0dBFD5E3A8748A0BF5, fd315;
add.f64 fd317, fd266, fd282;
add.f64 fd318, fd250, fd317;
add.f64 fd319, fd268, fd284;
add.f64 fd320, fd252, fd319;
mul.f64 fd321, fd317, 0d3FE0000000000000;
sub.f64 fd322, fd250, fd321;
sub.f64 fd323, fd268, fd284;
mul.f64 fd324, fd323, 0d3FEBB67AE8584CAA;
add.f64 fd325, fd324, fd322;
sub.f64 fd326, fd322, fd324;
mul.f64 fd327, fd319, 0d3FE0000000000000;
sub.f64 fd328, fd252, fd327;
sub.f64 fd329, fd266, fd282;
mul.f64 fd330, fd329, 0d3FEBB67AE8584CAA;
sub.f64 fd331, fd328, fd330;
add.f64 fd332, fd330, fd328;
add.f64 fd333, fd299, fd304;
add.f64 fd334, fd257, fd333;
add.f64 fd335, fd301, fd306;
add.f64 fd336, fd263, fd335;
mul.f64 fd337, fd333, 0d3FE0000000000000;
sub.f64 fd338, fd257, fd337;
sub.f64 fd339, fd301, fd306;
mul.f64 fd340, fd339, 0d3FEBB67AE8584CAA;
add.f64 fd341, fd340, fd338;
sub.f64 fd342, fd338, fd340;
mul.f64 fd343, fd335, 0d3FE0000000000000;
sub.f64 fd344, fd263, fd343;
sub.f64 fd345, fd299, fd304;
mul.f64 fd346, fd345, 0d3FEBB67AE8584CAA;
sub.f64 fd347, fd344, fd346;
add.f64 fd348, fd346, fd344;
add.f64 fd349, fd309, fd314;
add.f64 fd350, fd258, fd349;
add.f64 fd351, fd311, fd316;
add.f64 fd352, fd264, fd351;
mul.f64 fd353, fd349, 0d3FE0000000000000;
sub.f64 fd354, fd258, fd353;
sub.f64 fd355, fd311, fd316;
mul.f64 fd356, fd355, 0d3FEBB67AE8584CAA;
add.f64 fd357, fd356, fd354;
sub.f64 fd358, fd354, fd356;
mul.f64 fd359, fd351, 0d3FE0000000000000;
sub.f64 fd360, fd264, fd359;
sub.f64 fd361, fd309, fd314;
mul.f64 fd362, fd361, 0d3FEBB67AE8584CAA;
sub.f64 fd363, fd360, fd362;
add.f64 fd364, fd362, fd360;
mul.wide.u32 rd7, r7, 954437177;
shr.u64 rd8, rd7, 33;
cvt.u32.u64 r12, rd8;
mul.lo.s32 r13, r12, 9;
sub.s32 r14, r7, r13;
mul.wide.u32 rd9, r12, 16;
mov.u64 rd10, %20;
add.s64 rd11, rd10, rd9;
ld.global.v2.f64 {fd365, fd366}, [rd11];
mul.f64 fd369, fd365, fd334;
mul.f64 fd370, fd366, fd336;
sub.f64 fd371, fd369, fd370;
mul.f64 fd372, fd365, fd336;
fma.rn.f64 fd373, fd366, fd334, fd372;
mul.f64 fd374, fd365, fd365;
mul.f64 fd375, fd366, fd366;
sub.f64 fd376, fd374, fd375;
mul.f64 fd377, fd366, fd365;
fma.rn.f64 fd378, fd366, fd365, fd377;
mul.f64 fd379, fd376, fd350;
mul.f64 fd380, fd378, fd352;
sub.f64 fd381, fd379, fd380;
mul.f64 fd382, fd376, fd352;
fma.rn.f64 fd383, fd378, fd350, fd382;
mul.f64 fd384, fd365, fd376;
mul.f64 fd385, fd366, fd378;
sub.f64 fd386, fd384, fd385;
mul.f64 fd387, fd365, fd378;
fma.rn.f64 fd388, fd366, fd376, fd387;
mul.f64 fd389, fd386, fd325;
mul.f64 fd390, fd388, fd331;
sub.f64 fd391, fd389, fd390;
mul.f64 fd392, fd386, fd331;
fma.rn.f64 fd393, fd388, fd325, fd392;
mul.f64 fd394, fd365, fd386;
mul.f64 fd395, fd366, fd388;
sub.f64 fd396, fd394, fd395;
mul.f64 fd397, fd365, fd388;
fma.rn.f64 fd398, fd366, fd386, fd397;
mul.f64 fd399, fd396, fd341;
mul.f64 fd400, fd398, fd347;
sub.f64 fd401, fd399, fd400;
mul.f64 fd402, fd396, fd347;
fma.rn.f64 fd403, fd398, fd341, fd402;
ld.global.v2.f64 {fd404, fd405}, [rd11+144];
mul.f64 fd408, fd404, fd357;
mul.f64 fd409, fd405, fd363;
sub.f64 fd410, fd408, fd409;
mul.f64 fd411, fd404, fd363;
fma.rn.f64 fd412, fd405, fd357, fd411;
mul.f64 fd413, fd365, fd404;
mul.f64 fd414, fd366, fd405;
sub.f64 fd415, fd413, fd414;
mul.f64 fd416, fd365, fd405;
fma.rn.f64 fd417, fd366, fd404, fd416;
mul.f64 fd418, fd415, fd326;
mul.f64 fd419, fd417, fd332;
sub.f64 fd420, fd418, fd419;
mul.f64 fd421, fd415, fd332;
fma.rn.f64 fd422, fd417, fd326, fd421;
mul.f64 fd423, fd365, fd415;
mul.f64 fd424, fd366, fd417;
sub.f64 fd425, fd423, fd424;
mul.f64 fd426, fd365, fd417;
fma.rn.f64 fd427, fd366, fd415, fd426;
mul.f64 fd428, fd425, fd342;
mul.f64 fd429, fd427, fd348;
sub.f64 fd430, fd428, fd429;
mul.f64 fd431, fd425, fd348;
fma.rn.f64 fd432, fd427, fd342, fd431;
mul.f64 fd433, fd365, fd425;
mul.f64 fd434, fd366, fd427;
sub.f64 fd435, fd433, fd434;
mul.f64 fd436, fd365, fd427;
fma.rn.f64 fd437, fd366, fd425, fd436;
mul.f64 fd438, fd435, fd358;
mul.f64 fd439, fd437, fd364;
sub.f64 fd440, fd438, fd439;
mul.f64 fd441, fd435, fd364;
fma.rn.f64 fd442, fd437, fd358, fd441;
shl.b32 r15, r14, 3;
add.s32 r16, r8, r15;
barrier.sync 0;
mad.lo.s32 r17, r12, 648, r16;
st.shared.f64 [r17], fd318;
st.shared.f64 [r17+72], fd371;
st.shared.f64 [r17+144], fd381;
st.shared.f64 [r17+216], fd391;
st.shared.f64 [r17+288], fd401;
st.shared.f64 [r17+360], fd410;
st.shared.f64 [r17+432], fd420;
st.shared.f64 [r17+504], fd430;
st.shared.f64 [r17+576], fd440;
barrier.sync 0;
ld.shared.f64 fd443, [r11];
ld.shared.f64 fd444, [r11+648];
ld.shared.f64 fd445, [r11+1296];
ld.shared.f64 fd446, [r11+1944];
ld.shared.f64 fd447, [r11+2592];
ld.shared.f64 fd448, [r11+3240];
ld.shared.f64 fd449, [r11+3888];
ld.shared.f64 fd450, [r11+4536];
ld.shared.f64 fd451, [r11+5184];
barrier.sync 0;
st.shared.f64 [r17], fd320;
st.shared.f64 [r17+72], fd373;
st.shared.f64 [r17+144], fd383;
st.shared.f64 [r17+216], fd393;
st.shared.f64 [r17+288], fd403;
st.shared.f64 [r17+360], fd412;
st.shared.f64 [r17+432], fd422;
st.shared.f64 [r17+504], fd432;
st.shared.f64 [r17+576], fd442;
barrier.sync 0;
ld.shared.f64 fd452, [r11];
ld.shared.f64 fd453, [r11+648];
ld.shared.f64 fd454, [r11+1296];
ld.shared.f64 fd455, [r11+1944];
ld.shared.f64 fd456, [r11+2592];
ld.shared.f64 fd457, [r11+3240];
ld.shared.f64 fd458, [r11+3888];
ld.shared.f64 fd459, [r11+4536];
ld.shared.f64 fd460, [r11+5184];
add.f64 fd461, fd446, fd449;
add.f64 fd462, fd443, fd461;
add.f64 fd463, fd455, fd458;
add.f64 fd464, fd452, fd463;
mul.f64 fd465, fd461, 0d3FE0000000000000;
sub.f64 fd466, fd443, fd465;
sub.f64 fd467, fd455, fd458;
mul.f64 fd468, fd467, 0d3FEBB67AE8584CAA;
add.f64 fd469, fd468, fd466;
sub.f64 fd470, fd466, fd468;
mul.f64 fd471, fd463, 0d3FE0000000000000;
sub.f64 fd472, fd452, fd471;
sub.f64 fd473, fd446, fd449;
mul.f64 fd474, fd473, 0d3FEBB67AE8584CAA;
sub.f64 fd475, fd472, fd474;
add.f64 fd476, fd474, fd472;
add.f64 fd477, fd447, fd450;
add.f64 fd478, fd444, fd477;
add.f64 fd479, fd456, fd459;
add.f64 fd480, fd453, fd479;
mul.f64 fd481, fd477, 0d3FE0000000000000;
sub.f64 fd482, fd444, fd481;
sub.f64 fd483, fd456, fd459;
mul.f64 fd484, fd483, 0d3FEBB67AE8584CAA;
add.f64 fd485, fd484, fd482;
sub.f64 fd486, fd482, fd484;
mul.f64 fd487, fd479, 0d3FE0000000000000;
sub.f64 fd488, fd453, fd487;
sub.f64 fd489, fd447, fd450;
mul.f64 fd490, fd489, 0d3FEBB67AE8584CAA;
sub.f64 fd491, fd488, fd490;
add.f64 fd492, fd490, fd488;
add.f64 fd493, fd448, fd451;
add.f64 fd494, fd445, fd493;
add.f64 fd495, fd457, fd460;
add.f64 fd496, fd454, fd495;
mul.f64 fd497, fd493, 0d3FE0000000000000;
sub.f64 fd498, fd445, fd497;
sub.f64 fd499, fd457, fd460;
mul.f64 fd500, fd499, 0d3FEBB67AE8584CAA;
add.f64 fd501, fd500, fd498;
sub.f64 fd502, fd498, fd500;
mul.f64 fd503, fd495, 0d3FE0000000000000;
sub.f64 fd504, fd454, fd503;
sub.f64 fd505, fd448, fd451;
mul.f64 fd506, fd505, 0d3FEBB67AE8584CAA;
sub.f64 fd507, fd504, fd506;
add.f64 fd508, fd506, fd504;
mul.f64 fd509, fd485, 0d3FE8836FA2CF5039;
mul.f64 fd510, fd491, 0dBFE491B7523C161D;
sub.f64 fd511, fd509, fd510;
mul.f64 fd512, fd491, 0d3FE8836FA2CF5039;
fma.rn.f64 fd513, fd485, 0dBFE491B7523C161D, fd512;
mul.f64 fd514, fd501, 0d3FC63A1A7E0B738A;
mul.f64 fd515, fd507, 0dBFEF838B8C811C17;
sub.f64 fd516, fd514, fd515;
mul.f64 fd517, fd507, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd518, fd501, 0dBFEF838B8C811C17, fd517;
mul.f64 fd519, fd486, 0d3FC63A1A7E0B738A;
mul.f64 fd520, fd492, 0dBFEF838B8C811C17;
sub.f64 fd521, fd519, fd520;
mul.f64 fd522, fd492, 0d3FC63A1A7E0B738A;
fma.rn.f64 fd523, fd486, 0dBFEF838B8C811C17, fd522;
mul.f64 fd524, fd502, 0dBFEE11F642522D1C;
mul.f64 fd525, fd508, 0dBFD5E3A8748A0BF5;
sub.f64 fd526, fd524, fd525;
mul.f64 fd527, fd508, 0dBFEE11F642522D1C;
fma.rn.f64 fd528, fd502, 0dBFD5E3A8748A0BF5, fd527;
add.f64 fd529, fd478, fd494;
add.f64 fd530, fd480, fd496;
mul.f64 fd531, fd529, 0d3FE0000000000000;
sub.f64 fd532, fd462, fd531;
sub.f64 fd533, fd480, fd496;
mul.f64 fd534, fd533, 0d3FEBB67AE8584CAA;
mul.f64 fd535, fd530, 0d3FE0000000000000;
sub.f64 fd536, fd464, fd535;
sub.f64 fd537, fd478, fd494;
mul.f64 fd538, fd537, 0d3FEBB67AE8584CAA;
add.f64 fd539, fd511, fd516;
add.f64 fd540, fd513, fd518;
mul.f64 fd541, fd539, 0d3FE0000000000000;
sub.f64 fd542, fd469, fd541;
sub.f64 fd543, fd513, fd518;
mul.f64 fd544, fd543, 0d3FEBB67AE8584CAA;
mul.f64 fd545, fd540, 0d3FE0000000000000;
sub.f64 fd546, fd475, fd545;
sub.f64 fd547, fd511, fd516;
mul.f64 fd548, fd547, 0d3FEBB67AE8584CAA;
add.f64 fd549, fd521, fd526;
add.f64 fd550, fd523, fd528;
mul.f64 fd551, fd549, 0d3FE0000000000000;
sub.f64 fd552, fd470, fd551;
sub.f64 fd553, fd523, fd528;
mul.f64 fd554, fd553, 0d3FEBB67AE8584CAA;
mul.f64 fd555, fd550, 0d3FE0000000000000;
sub.f64 fd556, fd476, fd555;
sub.f64 fd557, fd521, fd526;
mul.f64 fd558, fd557, 0d3FEBB67AE8584CAA;
add.f64 %0, fd462, fd529;
add.f64 %1, fd464, fd530;
add.f64 %3, fd475, fd540;
add.f64 %2, fd469, fd539;
add.f64 %5, fd476, fd550;
add.f64 %4, fd470, fd549;
add.f64 %6, fd534, fd532;
sub.f64 %7, fd536, fd538;
sub.f64 %9, fd546, fd548;
add.f64 %8, fd544, fd542;
sub.f64 %11, fd556, fd558;
add.f64 %10, fd554, fd552;
sub.f64 %12, fd532, fd534;
add.f64 %13, fd538, fd536;
add.f64 %15, fd548, fd546;
sub.f64 %14, fd542, fd544;
add.f64 %17, fd558, fd556;
sub.f64 %16, fd552, fd554;
})"
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y), "=d"(rmem[3].x), "=d"(rmem[3].y), "=d"(rmem[4].x), "=d"(rmem[4].y), "=d"(rmem[5].x), "=d"(rmem[5].y), "=d"(rmem[6].x), "=d"(rmem[6].y), "=d"(rmem[7].x), "=d"(rmem[7].y), "=d"(rmem[8].x), "=d"(rmem[8].y): "r"(smem), "l"(lut_dp_9_729), "l"(lut_dp_9_81), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y), "d"(rmem[2].y), "d"(rmem[3].x), "d"(rmem[3].y), "d"(rmem[4].x), "d"(rmem[4].y), "d"(rmem[4].y), "d"(rmem[5].x), "d"(rmem[5].y), "d"(rmem[5].y), "d"(rmem[6].x), "d"(rmem[6].y), "d"(rmem[7].x), "d"(rmem[7].y), "d"(rmem[7].y), "d"(rmem[8].x), "d"(rmem[8].y));
};




// Specialization <525, double, 1> of cufftdx_private_function: a generated,
// single-statement inline-PTX routine. The include guard of this header places
// it in the 729-point FP64 forward set; what template id 525 selects is decided
// outside this block.
//
// Parameters
//   rmem  Per-thread array of complex<double>. Elements 0..2 are read as
//         inputs, and both components of elements 0..2 are overwritten with
//         the results (asm operands %0..%5).
//   smem  32-bit shared-memory address (operand %6) used as the base of the
//         exchange buffer. The routine works on the region that starts at
//         smem + (tid.y + tid.x / 243) * 5832 bytes and touches 5832 bytes
//         (729 doubles) of it.
//
// What the asm body does, in order (t = tid.x % 243)
//   1. Combines the three complex inputs with a three-input add/subtract
//      stage (constants 0.5 and 0d3FEBB67AE8584CAA ~ 0.8660254).
//   2. Leaves output 0 unscaled, multiplies output 1 by lut_dp_3_729[t] and
//      output 2 by the entry 243 elements further on (byte offset 3888).
//   3. Exchanges the values with other threads through shared memory. Each
//      thread stores 3 consecutive doubles at element 3 * t and reloads 3
//      doubles starting at element t with a stride of 243 doubles. The real
//      parts make this round trip first; the imaginary parts then reuse the
//      same addresses.
//   4. Repeats steps 1-3 four more times. The reload pattern stays as in
//      step 3; the table, index, second-entry offset and store pattern change:
//        lut_dp_3_243  index t / 3   second entry +81  store at  9*(t/3)  + t%3,  stride 3
//        lut_dp_3_81   index t / 9   second entry +27  store at 27*(t/9)  + t%9,  stride 9
//        lut_dp_3_27   index t / 27  second entry +9   store at 81*(t/27) + t%27, stride 27
//        lut_dp_3_9    index t / 81  second entry +3   store at 243*(t/81) + t%81, stride 81
//      (offsets and strides are in table elements / doubles). The divisions
//      are done with multiply-and-shift sequences.
//   5. Runs one last three-input stage and writes the 6 results to rmem[0..2].
//
// Synchronization
//   The body executes `barrier.sync 0` twenty times, unconditionally.
//   NOTE(review): this presumably requires every thread of the block to call
//   the routine under uniform control flow - confirm against the callers.
//
// Operand numbering
//   %6 = smem, %7..%11 = lut_dp_3_729, lut_dp_3_243, lut_dp_3_81, lut_dp_3_27,
//   lut_dp_3_9, %12..%18 = inputs. The input list names rmem[1].y twice
//   (%15 and %16); the PTX text references only %16, and %15 is never used.
//   Removing the duplicate would shift %17 and %18, so the list must not be
//   "cleaned up" without renumbering the PTX.
template<> __forceinline__ __device__ void cufftdx_private_function<525, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

asm volatile (R"({
.reg .b32 r<40>;
.reg .f64 fd<229>;
.reg .b64 rd<27>;
mov.u32 r1, %tid.y;
mov.u32 r2, %6;
mad.lo.s32 r3, r1, 5832, r2;
mov.u32 r4, %tid.x;
add.f64 fd13, %14, %17;
add.f64 fd14, %12, fd13;
add.f64 fd15, %16, %18;
add.f64 fd16, %13, fd15;
mul.f64 fd17, fd13, 0d3FE0000000000000;
sub.f64 fd18, %12, fd17;
sub.f64 fd19, %16, %18;
mul.f64 fd20, fd19, 0d3FEBB67AE8584CAA;
add.f64 fd21, fd20, fd18;
sub.f64 fd22, fd18, fd20;
mul.f64 fd23, fd15, 0d3FE0000000000000;
sub.f64 fd24, %13, fd23;
sub.f64 fd25, %14, %17;
mul.f64 fd26, fd25, 0d3FEBB67AE8584CAA;
sub.f64 fd27, fd24, fd26;
add.f64 fd28, fd26, fd24;
mul.wide.u32 rd2, r4, -2032597691;
shr.u64 rd3, rd2, 39;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 243;
sub.s32 r7, r4, r6;
mad.lo.s32 r8, r5, 5832, r3;
mul.wide.u32 rd4, r7, 16;
mov.u64 rd5, %7;
add.s64 rd6, rd5, rd4;
ld.global.v2.f64 {fd29, fd30}, [rd6];
mul.f64 fd33, fd29, fd21;
mul.f64 fd34, fd30, fd27;
sub.f64 fd35, fd33, fd34;
mul.f64 fd36, fd29, fd27;
fma.rn.f64 fd37, fd30, fd21, fd36;
ld.global.v2.f64 {fd38, fd39}, [rd6+3888];
mul.f64 fd42, fd38, fd22;
mul.f64 fd43, fd39, fd28;
sub.f64 fd44, fd42, fd43;
mul.f64 fd45, fd38, fd28;
fma.rn.f64 fd46, fd39, fd22, fd45;
barrier.sync 0;
mad.lo.s32 r9, r7, 24, r8;
st.shared.f64 [r9], fd14;
st.shared.f64 [r9+8], fd35;
st.shared.f64 [r9+16], fd44;
barrier.sync 0;
shl.b32 r10, r7, 4;
sub.s32 r11, r9, r10;
ld.shared.f64 fd47, [r11];
ld.shared.f64 fd48, [r11+1944];
ld.shared.f64 fd49, [r11+3888];
barrier.sync 0;
st.shared.f64 [r9], fd16;
st.shared.f64 [r9+8], fd37;
st.shared.f64 [r9+16], fd46;
barrier.sync 0;
ld.shared.f64 fd50, [r11];
ld.shared.f64 fd51, [r11+1944];
ld.shared.f64 fd52, [r11+3888];
add.f64 fd53, fd48, fd49;
add.f64 fd54, fd47, fd53;
add.f64 fd55, fd51, fd52;
add.f64 fd56, fd50, fd55;
mul.f64 fd57, fd53, 0d3FE0000000000000;
sub.f64 fd58, fd47, fd57;
sub.f64 fd59, fd51, fd52;
mul.f64 fd60, fd59, 0d3FEBB67AE8584CAA;
add.f64 fd61, fd60, fd58;
sub.f64 fd62, fd58, fd60;
mul.f64 fd63, fd55, 0d3FE0000000000000;
sub.f64 fd64, fd50, fd63;
sub.f64 fd65, fd48, fd49;
mul.f64 fd66, fd65, 0d3FEBB67AE8584CAA;
sub.f64 fd67, fd64, fd66;
add.f64 fd68, fd66, fd64;
mul.wide.u32 rd7, r7, -1431655765;
shr.u64 rd8, rd7, 33;
cvt.u32.u64 r12, rd8;
mul.lo.s32 r13, r12, 3;
sub.s32 r14, r7, r13;
shl.b32 r15, r14, 3;
add.s32 r16, r8, r15;
mul.wide.u32 rd9, r12, 16;
mov.u64 rd10, %8;
add.s64 rd11, rd10, rd9;
ld.global.v2.f64 {fd69, fd70}, [rd11];
mul.f64 fd73, fd69, fd61;
mul.f64 fd74, fd70, fd67;
sub.f64 fd75, fd73, fd74;
mul.f64 fd76, fd69, fd67;
fma.rn.f64 fd77, fd70, fd61, fd76;
ld.global.v2.f64 {fd78, fd79}, [rd11+1296];
mul.f64 fd82, fd78, fd62;
mul.f64 fd83, fd79, fd68;
sub.f64 fd84, fd82, fd83;
mul.f64 fd85, fd78, fd68;
fma.rn.f64 fd86, fd79, fd62, fd85;
barrier.sync 0;
mad.lo.s32 r17, r12, 72, r16;
st.shared.f64 [r17], fd54;
st.shared.f64 [r17+24], fd75;
st.shared.f64 [r17+48], fd84;
barrier.sync 0;
ld.shared.f64 fd87, [r11];
ld.shared.f64 fd88, [r11+1944];
ld.shared.f64 fd89, [r11+3888];
barrier.sync 0;
st.shared.f64 [r17], fd56;
st.shared.f64 [r17+24], fd77;
st.shared.f64 [r17+48], fd86;
barrier.sync 0;
ld.shared.f64 fd90, [r11];
ld.shared.f64 fd91, [r11+1944];
ld.shared.f64 fd92, [r11+3888];
add.f64 fd93, fd88, fd89;
add.f64 fd94, fd87, fd93;
add.f64 fd95, fd91, fd92;
add.f64 fd96, fd90, fd95;
mul.f64 fd97, fd93, 0d3FE0000000000000;
sub.f64 fd98, fd87, fd97;
sub.f64 fd99, fd91, fd92;
mul.f64 fd100, fd99, 0d3FEBB67AE8584CAA;
add.f64 fd101, fd100, fd98;
sub.f64 fd102, fd98, fd100;
mul.f64 fd103, fd95, 0d3FE0000000000000;
sub.f64 fd104, fd90, fd103;
sub.f64 fd105, fd88, fd89;
mul.f64 fd106, fd105, 0d3FEBB67AE8584CAA;
sub.f64 fd107, fd104, fd106;
add.f64 fd108, fd106, fd104;
mul.wide.u32 rd12, r7, 954437177;
shr.u64 rd13, rd12, 33;
cvt.u32.u64 r18, rd13;
mul.lo.s32 r19, r18, 9;
sub.s32 r20, r7, r19;
shl.b32 r21, r20, 3;
add.s32 r22, r8, r21;
mul.wide.u32 rd14, r18, 16;
mov.u64 rd15, %9;
add.s64 rd16, rd15, rd14;
ld.global.v2.f64 {fd109, fd110}, [rd16];
mul.f64 fd113, fd109, fd101;
mul.f64 fd114, fd110, fd107;
sub.f64 fd115, fd113, fd114;
mul.f64 fd116, fd109, fd107;
fma.rn.f64 fd117, fd110, fd101, fd116;
ld.global.v2.f64 {fd118, fd119}, [rd16+432];
mul.f64 fd122, fd118, fd102;
mul.f64 fd123, fd119, fd108;
sub.f64 fd124, fd122, fd123;
mul.f64 fd125, fd118, fd108;
fma.rn.f64 fd126, fd119, fd102, fd125;
barrier.sync 0;
mad.lo.s32 r23, r18, 216, r22;
st.shared.f64 [r23], fd94;
st.shared.f64 [r23+72], fd115;
st.shared.f64 [r23+144], fd124;
barrier.sync 0;
ld.shared.f64 fd127, [r11];
ld.shared.f64 fd128, [r11+1944];
ld.shared.f64 fd129, [r11+3888];
barrier.sync 0;
st.shared.f64 [r23], fd96;
st.shared.f64 [r23+72], fd117;
st.shared.f64 [r23+144], fd126;
barrier.sync 0;
ld.shared.f64 fd130, [r11];
ld.shared.f64 fd131, [r11+1944];
ld.shared.f64 fd132, [r11+3888];
add.f64 fd133, fd128, fd129;
add.f64 fd134, fd127, fd133;
add.f64 fd135, fd131, fd132;
add.f64 fd136, fd130, fd135;
mul.f64 fd137, fd133, 0d3FE0000000000000;
sub.f64 fd138, fd127, fd137;
sub.f64 fd139, fd131, fd132;
mul.f64 fd140, fd139, 0d3FEBB67AE8584CAA;
add.f64 fd141, fd140, fd138;
sub.f64 fd142, fd138, fd140;
mul.f64 fd143, fd135, 0d3FE0000000000000;
sub.f64 fd144, fd130, fd143;
sub.f64 fd145, fd128, fd129;
mul.f64 fd146, fd145, 0d3FEBB67AE8584CAA;
sub.f64 fd147, fd144, fd146;
add.f64 fd148, fd146, fd144;
mul.wide.u32 rd17, r7, 795364315;
shr.u64 rd18, rd17, 32;
cvt.u32.u64 r24, rd18;
sub.s32 r25, r7, r24;
shr.u32 r26, r25, 1;
add.s32 r27, r26, r24;
shr.u32 r28, r27, 4;
mul.lo.s32 r29, r28, 27;
sub.s32 r30, r7, r29;
shl.b32 r31, r30, 3;
add.s32 r32, r8, r31;
mul.wide.u32 rd19, r28, 16;
mov.u64 rd20, %10;
add.s64 rd21, rd20, rd19;
ld.global.v2.f64 {fd149, fd150}, [rd21];
mul.f64 fd153, fd149, fd141;
mul.f64 fd154, fd150, fd147;
sub.f64 fd155, fd153, fd154;
mul.f64 fd156, fd149, fd147;
fma.rn.f64 fd157, fd150, fd141, fd156;
ld.global.v2.f64 {fd158, fd159}, [rd21+144];
mul.f64 fd162, fd158, fd142;
mul.f64 fd163, fd159, fd148;
sub.f64 fd164, fd162, fd163;
mul.f64 fd165, fd158, fd148;
fma.rn.f64 fd166, fd159, fd142, fd165;
barrier.sync 0;
mad.lo.s32 r33, r28, 648, r32;
st.shared.f64 [r33], fd134;
st.shared.f64 [r33+216], fd155;
st.shared.f64 [r33+432], fd164;
barrier.sync 0;
ld.shared.f64 fd167, [r11];
ld.shared.f64 fd168, [r11+1944];
ld.shared.f64 fd169, [r11+3888];
barrier.sync 0;
st.shared.f64 [r33], fd136;
st.shared.f64 [r33+216], fd157;
st.shared.f64 [r33+432], fd166;
barrier.sync 0;
ld.shared.f64 fd170, [r11];
ld.shared.f64 fd171, [r11+1944];
ld.shared.f64 fd172, [r11+3888];
add.f64 fd173, fd168, fd169;
add.f64 fd174, fd167, fd173;
add.f64 fd175, fd171, fd172;
add.f64 fd176, fd170, fd175;
mul.f64 fd177, fd173, 0d3FE0000000000000;
sub.f64 fd178, fd167, fd177;
sub.f64 fd179, fd171, fd172;
mul.f64 fd180, fd179, 0d3FEBB67AE8584CAA;
add.f64 fd181, fd180, fd178;
sub.f64 fd182, fd178, fd180;
mul.f64 fd183, fd175, 0d3FE0000000000000;
sub.f64 fd184, fd170, fd183;
sub.f64 fd185, fd168, fd169;
mul.f64 fd186, fd185, 0d3FEBB67AE8584CAA;
sub.f64 fd187, fd184, fd186;
add.f64 fd188, fd186, fd184;
mul.wide.u32 rd22, r7, -901412889;
shr.u64 rd23, rd22, 38;
cvt.u32.u64 r34, rd23;
mul.lo.s32 r35, r34, 81;
sub.s32 r36, r7, r35;
shl.b32 r37, r36, 3;
add.s32 r38, r8, r37;
mul.wide.u32 rd24, r34, 16;
mov.u64 rd25, %11;
add.s64 rd26, rd25, rd24;
ld.global.v2.f64 {fd189, fd190}, [rd26];
mul.f64 fd193, fd189, fd181;
mul.f64 fd194, fd190, fd187;
sub.f64 fd195, fd193, fd194;
mul.f64 fd196, fd189, fd187;
fma.rn.f64 fd197, fd190, fd181, fd196;
ld.global.v2.f64 {fd198, fd199}, [rd26+48];
mul.f64 fd202, fd198, fd182;
mul.f64 fd203, fd199, fd188;
sub.f64 fd204, fd202, fd203;
mul.f64 fd205, fd198, fd188;
fma.rn.f64 fd206, fd199, fd182, fd205;
barrier.sync 0;
mad.lo.s32 r39, r34, 1944, r38;
st.shared.f64 [r39], fd174;
st.shared.f64 [r39+648], fd195;
st.shared.f64 [r39+1296], fd204;
barrier.sync 0;
ld.shared.f64 fd207, [r11];
ld.shared.f64 fd208, [r11+1944];
ld.shared.f64 fd209, [r11+3888];
barrier.sync 0;
st.shared.f64 [r39], fd176;
st.shared.f64 [r39+648], fd197;
st.shared.f64 [r39+1296], fd206;
barrier.sync 0;
ld.shared.f64 fd210, [r11];
ld.shared.f64 fd211, [r11+1944];
ld.shared.f64 fd212, [r11+3888];
add.f64 fd213, fd208, fd209;
add.f64 fd214, fd211, fd212;
mul.f64 fd215, fd213, 0d3FE0000000000000;
sub.f64 fd216, fd207, fd215;
sub.f64 fd217, fd211, fd212;
mul.f64 fd218, fd217, 0d3FEBB67AE8584CAA;
mul.f64 fd219, fd214, 0d3FE0000000000000;
sub.f64 fd220, fd210, fd219;
sub.f64 fd221, fd208, fd209;
mul.f64 fd222, fd221, 0d3FEBB67AE8584CAA;
add.f64 %0, fd207, fd213;
add.f64 %1, fd210, fd214;
add.f64 %2, fd218, fd216;
sub.f64 %3, fd220, fd222;
sub.f64 %4, fd216, fd218;
add.f64 %5, fd222, fd220;
})"
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y): "r"(smem), "l"(lut_dp_3_729), "l"(lut_dp_3_243), "l"(lut_dp_3_81), "l"(lut_dp_3_27), "l"(lut_dp_3_9), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y));
};




// Specialization <526, double, 1> of cufftdx_private_function.
//
// The whole body is one inline-PTX block. Each calling thread passes three complex
// doubles in rmem[0..2] and gets three complex doubles back in the same slots.
// The PTX performs six radix-3 butterflies (3^6 = 729; the include guard of this
// header names it the 729-point FP64 forward file), with five twiddle
// multiplications and five exchanges through shared memory in between.
//
// Parameters:
//   rmem - per-thread array; elements 0..2 (.x and .y) are read as inputs and
//          overwritten with the results.
//   smem - 32-bit value used directly as the base address of st.shared/ld.shared.
//
// Addressing, as computed by the PTX (t = tid.x % 243, q = tid.x / 243; all
// integer divisions are done with multiply-high + shift sequences):
//   base = smem + tid.y * 11664 + q * 11664            (bytes)
//   Every exchange reads 16-byte elements at base + 16*t + {0, 3888, 7776}, so one
//   group of 243 threads touches base .. base + 11663 (729 elements of 16 bytes).
//   NOTE(review): tid.y and q share the same 11664-byte stride, so the regions are
//   only disjoint when at most one of them is non-zero; presumably blockDim.x is
//   243 -- confirm against the launch configuration.
//
// Per-stage twiddle reads (ld.global.v2.f64, indices in 16-byte elements) and
// shared-memory store offsets (bytes, three stores per stage):
//   stage 1: lut_dp_3_729[t],     [t + 243];    store at base + 48*t + {0, 16, 32}
//   stage 2: lut_dp_3_243[t/3],   [t/3 + 81];   store at base + 16*(t%3)  + 144*(t/3)   + {0, 48, 96}
//   stage 3: lut_dp_3_81[t/9],    [t/9 + 27];   store at base + 16*(t%9)  + 432*(t/9)   + {0, 144, 288}
//   stage 4: lut_dp_3_27[t/27],   [t/27 + 9];   store at base + 16*(t%27) + 1296*(t/27) + {0, 432, 864}
//   stage 5: lut_dp_3_9[t/81],    [t/81 + 3];   store at base + 16*(t%81) + 3888*(t/81) + {0, 1296, 2592}
//   The first butterfly output of each stage is stored without a twiddle multiply.
//
// Constants in the butterflies: 0d3FE0000000000000 is 0.5 and 0d3FEBB67AE8584CAA
// is approximately 0.8660254 (sqrt(3)/2).
//
// Synchronization: the PTX executes `barrier.sync 0` ten times (one before and one
// after the stores of each of the five exchanges). NOTE(review): per the PTX ISA a
// barrier without a thread count involves all threads of the CTA, so every thread
// of the block presumably has to call this function -- confirm with the caller.
template<> __forceinline__ __device__ void cufftdx_private_function<526, double, 1>(cufftdx::detail::complex<double> *rmem, unsigned smem){

// Single PTX program; the raw string below is passed verbatim to the assembler.
asm volatile (R"({
.reg .b32 r<40>;
.reg .f64 fd<259>;
.reg .b64 rd<27>;
mov.u32 r1, %tid.y;
mov.u32 r2, %6;
mad.lo.s32 r3, r1, 11664, r2;
mov.u32 r4, %tid.x;
add.f64 fd13, %14, %17;
add.f64 fd14, %16, %18;
mul.f64 fd15, fd13, 0d3FE0000000000000;
sub.f64 fd16, %12, fd15;
sub.f64 fd17, %16, %18;
mul.f64 fd18, fd17, 0d3FEBB67AE8584CAA;
add.f64 fd19, fd18, fd16;
sub.f64 fd20, fd16, fd18;
mul.f64 fd21, fd14, 0d3FE0000000000000;
sub.f64 fd22, %13, fd21;
sub.f64 fd23, %14, %17;
mul.f64 fd24, fd23, 0d3FEBB67AE8584CAA;
sub.f64 fd25, fd22, fd24;
add.f64 fd26, fd24, fd22;
mul.wide.u32 rd2, r4, -2032597691;
shr.u64 rd3, rd2, 39;
cvt.u32.u64 r5, rd3;
mul.lo.s32 r6, r5, 243;
sub.s32 r7, r4, r6;
mad.lo.s32 r8, r5, 11664, r3;
mul.wide.u32 rd4, r7, 16;
mov.u64 rd5, %7;
add.s64 rd6, rd5, rd4;
ld.global.v2.f64 {fd27, fd28}, [rd6];
mul.f64 fd31, fd27, fd19;
mul.f64 fd32, fd28, fd25;
mul.f64 fd33, fd27, fd25;
ld.global.v2.f64 {fd34, fd35}, [rd6+3888];
mul.f64 fd38, fd34, fd20;
mul.f64 fd39, fd35, fd26;
mul.f64 fd40, fd34, fd26;
barrier.sync 0;
mad.lo.s32 r9, r7, 48, r8;
add.f64 fd41, %13, fd14;
add.f64 fd42, %12, fd13;
st.shared.v2.f64 [r9], {fd42, fd41};
fma.rn.f64 fd43, fd28, fd19, fd33;
sub.f64 fd44, fd31, fd32;
st.shared.v2.f64 [r9+16], {fd44, fd43};
fma.rn.f64 fd45, fd35, fd20, fd40;
sub.f64 fd46, fd38, fd39;
st.shared.v2.f64 [r9+32], {fd46, fd45};
barrier.sync 0;
shl.b32 r10, r7, 5;
sub.s32 r11, r9, r10;
ld.shared.v2.f64 {fd47, fd48}, [r11];
ld.shared.v2.f64 {fd51, fd52}, [r11+3888];
ld.shared.v2.f64 {fd55, fd56}, [r11+7776];
add.f64 fd59, fd51, fd55;
add.f64 fd60, fd52, fd56;
mul.f64 fd61, fd59, 0d3FE0000000000000;
sub.f64 fd62, fd47, fd61;
sub.f64 fd63, fd52, fd56;
mul.f64 fd64, fd63, 0d3FEBB67AE8584CAA;
add.f64 fd65, fd64, fd62;
sub.f64 fd66, fd62, fd64;
mul.f64 fd67, fd60, 0d3FE0000000000000;
sub.f64 fd68, fd48, fd67;
sub.f64 fd69, fd51, fd55;
mul.f64 fd70, fd69, 0d3FEBB67AE8584CAA;
sub.f64 fd71, fd68, fd70;
add.f64 fd72, fd70, fd68;
mul.wide.u32 rd7, r7, -1431655765;
shr.u64 rd8, rd7, 33;
cvt.u32.u64 r12, rd8;
mul.lo.s32 r13, r12, 3;
sub.s32 r14, r7, r13;
shl.b32 r15, r14, 4;
add.s32 r16, r8, r15;
mul.wide.u32 rd9, r12, 16;
mov.u64 rd10, %8;
add.s64 rd11, rd10, rd9;
ld.global.v2.f64 {fd73, fd74}, [rd11];
mul.f64 fd77, fd73, fd65;
mul.f64 fd78, fd74, fd71;
mul.f64 fd79, fd73, fd71;
ld.global.v2.f64 {fd80, fd81}, [rd11+1296];
mul.f64 fd84, fd80, fd66;
mul.f64 fd85, fd81, fd72;
mul.f64 fd86, fd80, fd72;
barrier.sync 0;
mad.lo.s32 r17, r12, 144, r16;
add.f64 fd87, fd48, fd60;
add.f64 fd88, fd47, fd59;
st.shared.v2.f64 [r17], {fd88, fd87};
fma.rn.f64 fd89, fd74, fd65, fd79;
sub.f64 fd90, fd77, fd78;
st.shared.v2.f64 [r17+48], {fd90, fd89};
fma.rn.f64 fd91, fd81, fd66, fd86;
sub.f64 fd92, fd84, fd85;
st.shared.v2.f64 [r17+96], {fd92, fd91};
barrier.sync 0;
ld.shared.v2.f64 {fd93, fd94}, [r11];
ld.shared.v2.f64 {fd97, fd98}, [r11+3888];
ld.shared.v2.f64 {fd101, fd102}, [r11+7776];
add.f64 fd105, fd97, fd101;
add.f64 fd106, fd98, fd102;
mul.f64 fd107, fd105, 0d3FE0000000000000;
sub.f64 fd108, fd93, fd107;
sub.f64 fd109, fd98, fd102;
mul.f64 fd110, fd109, 0d3FEBB67AE8584CAA;
add.f64 fd111, fd110, fd108;
sub.f64 fd112, fd108, fd110;
mul.f64 fd113, fd106, 0d3FE0000000000000;
sub.f64 fd114, fd94, fd113;
sub.f64 fd115, fd97, fd101;
mul.f64 fd116, fd115, 0d3FEBB67AE8584CAA;
sub.f64 fd117, fd114, fd116;
add.f64 fd118, fd116, fd114;
mul.wide.u32 rd12, r7, 954437177;
shr.u64 rd13, rd12, 33;
cvt.u32.u64 r18, rd13;
mul.lo.s32 r19, r18, 9;
sub.s32 r20, r7, r19;
shl.b32 r21, r20, 4;
add.s32 r22, r8, r21;
mul.wide.u32 rd14, r18, 16;
mov.u64 rd15, %9;
add.s64 rd16, rd15, rd14;
ld.global.v2.f64 {fd119, fd120}, [rd16];
mul.f64 fd123, fd119, fd111;
mul.f64 fd124, fd120, fd117;
mul.f64 fd125, fd119, fd117;
ld.global.v2.f64 {fd126, fd127}, [rd16+432];
mul.f64 fd130, fd126, fd112;
mul.f64 fd131, fd127, fd118;
mul.f64 fd132, fd126, fd118;
barrier.sync 0;
mad.lo.s32 r23, r18, 432, r22;
add.f64 fd133, fd94, fd106;
add.f64 fd134, fd93, fd105;
st.shared.v2.f64 [r23], {fd134, fd133};
fma.rn.f64 fd135, fd120, fd111, fd125;
sub.f64 fd136, fd123, fd124;
st.shared.v2.f64 [r23+144], {fd136, fd135};
fma.rn.f64 fd137, fd127, fd112, fd132;
sub.f64 fd138, fd130, fd131;
st.shared.v2.f64 [r23+288], {fd138, fd137};
barrier.sync 0;
ld.shared.v2.f64 {fd139, fd140}, [r11];
ld.shared.v2.f64 {fd143, fd144}, [r11+3888];
ld.shared.v2.f64 {fd147, fd148}, [r11+7776];
add.f64 fd151, fd143, fd147;
add.f64 fd152, fd144, fd148;
mul.f64 fd153, fd151, 0d3FE0000000000000;
sub.f64 fd154, fd139, fd153;
sub.f64 fd155, fd144, fd148;
mul.f64 fd156, fd155, 0d3FEBB67AE8584CAA;
add.f64 fd157, fd156, fd154;
sub.f64 fd158, fd154, fd156;
mul.f64 fd159, fd152, 0d3FE0000000000000;
sub.f64 fd160, fd140, fd159;
sub.f64 fd161, fd143, fd147;
mul.f64 fd162, fd161, 0d3FEBB67AE8584CAA;
sub.f64 fd163, fd160, fd162;
add.f64 fd164, fd162, fd160;
mul.wide.u32 rd17, r7, 795364315;
shr.u64 rd18, rd17, 32;
cvt.u32.u64 r24, rd18;
sub.s32 r25, r7, r24;
shr.u32 r26, r25, 1;
add.s32 r27, r26, r24;
shr.u32 r28, r27, 4;
mul.lo.s32 r29, r28, 27;
sub.s32 r30, r7, r29;
shl.b32 r31, r30, 4;
add.s32 r32, r8, r31;
mul.wide.u32 rd19, r28, 16;
mov.u64 rd20, %10;
add.s64 rd21, rd20, rd19;
ld.global.v2.f64 {fd165, fd166}, [rd21];
mul.f64 fd169, fd165, fd157;
mul.f64 fd170, fd166, fd163;
mul.f64 fd171, fd165, fd163;
ld.global.v2.f64 {fd172, fd173}, [rd21+144];
mul.f64 fd176, fd172, fd158;
mul.f64 fd177, fd173, fd164;
mul.f64 fd178, fd172, fd164;
barrier.sync 0;
mad.lo.s32 r33, r28, 1296, r32;
add.f64 fd179, fd140, fd152;
add.f64 fd180, fd139, fd151;
st.shared.v2.f64 [r33], {fd180, fd179};
fma.rn.f64 fd181, fd166, fd157, fd171;
sub.f64 fd182, fd169, fd170;
st.shared.v2.f64 [r33+432], {fd182, fd181};
fma.rn.f64 fd183, fd173, fd158, fd178;
sub.f64 fd184, fd176, fd177;
st.shared.v2.f64 [r33+864], {fd184, fd183};
barrier.sync 0;
ld.shared.v2.f64 {fd185, fd186}, [r11];
ld.shared.v2.f64 {fd189, fd190}, [r11+3888];
ld.shared.v2.f64 {fd193, fd194}, [r11+7776];
add.f64 fd197, fd189, fd193;
add.f64 fd198, fd190, fd194;
mul.f64 fd199, fd197, 0d3FE0000000000000;
sub.f64 fd200, fd185, fd199;
sub.f64 fd201, fd190, fd194;
mul.f64 fd202, fd201, 0d3FEBB67AE8584CAA;
add.f64 fd203, fd202, fd200;
sub.f64 fd204, fd200, fd202;
mul.f64 fd205, fd198, 0d3FE0000000000000;
sub.f64 fd206, fd186, fd205;
sub.f64 fd207, fd189, fd193;
mul.f64 fd208, fd207, 0d3FEBB67AE8584CAA;
sub.f64 fd209, fd206, fd208;
add.f64 fd210, fd208, fd206;
mul.wide.u32 rd22, r7, -901412889;
shr.u64 rd23, rd22, 38;
cvt.u32.u64 r34, rd23;
mul.lo.s32 r35, r34, 81;
sub.s32 r36, r7, r35;
shl.b32 r37, r36, 4;
add.s32 r38, r8, r37;
mul.wide.u32 rd24, r34, 16;
mov.u64 rd25, %11;
add.s64 rd26, rd25, rd24;
ld.global.v2.f64 {fd211, fd212}, [rd26];
mul.f64 fd215, fd211, fd203;
mul.f64 fd216, fd212, fd209;
mul.f64 fd217, fd211, fd209;
ld.global.v2.f64 {fd218, fd219}, [rd26+48];
mul.f64 fd222, fd218, fd204;
mul.f64 fd223, fd219, fd210;
mul.f64 fd224, fd218, fd210;
barrier.sync 0;
mad.lo.s32 r39, r34, 3888, r38;
add.f64 fd225, fd186, fd198;
add.f64 fd226, fd185, fd197;
st.shared.v2.f64 [r39], {fd226, fd225};
fma.rn.f64 fd227, fd212, fd203, fd217;
sub.f64 fd228, fd215, fd216;
st.shared.v2.f64 [r39+1296], {fd228, fd227};
fma.rn.f64 fd229, fd219, fd204, fd224;
sub.f64 fd230, fd222, fd223;
st.shared.v2.f64 [r39+2592], {fd230, fd229};
barrier.sync 0;
ld.shared.v2.f64 {fd231, fd232}, [r11];
ld.shared.v2.f64 {fd235, fd236}, [r11+3888];
ld.shared.v2.f64 {fd239, fd240}, [r11+7776];
add.f64 fd243, fd235, fd239;
add.f64 fd244, fd236, fd240;
mul.f64 fd245, fd243, 0d3FE0000000000000;
sub.f64 fd246, fd231, fd245;
sub.f64 fd247, fd236, fd240;
mul.f64 fd248, fd247, 0d3FEBB67AE8584CAA;
mul.f64 fd249, fd244, 0d3FE0000000000000;
sub.f64 fd250, fd232, fd249;
sub.f64 fd251, fd235, fd239;
mul.f64 fd252, fd251, 0d3FEBB67AE8584CAA;
add.f64 %1, fd232, fd244;
add.f64 %0, fd231, fd243;
sub.f64 %3, fd250, fd252;
add.f64 %2, fd248, fd246;
add.f64 %5, fd252, fd250;
sub.f64 %4, fd246, fd248;
})"
     // Operand map:
     //   %0-%5   outputs: rmem[0].x, rmem[0].y, rmem[1].x, rmem[1].y, rmem[2].x, rmem[2].y
     //   %6      smem (32-bit register)
     //   %7-%11  64-bit addresses of lut_dp_3_729, lut_dp_3_243, lut_dp_3_81, lut_dp_3_27, lut_dp_3_9
     //   %12-%13 rmem[0].x, rmem[0].y
     //   %14     rmem[1].x
     //   %15,%16 both bind rmem[1].y; the PTX above only references %16, so %15 is unused
     //   %17-%18 rmem[2].x, rmem[2].y
     : "=d"(rmem[0].x), "=d"(rmem[0].y), "=d"(rmem[1].x), "=d"(rmem[1].y), "=d"(rmem[2].x), "=d"(rmem[2].y): "r"(smem), "l"(lut_dp_3_729), "l"(lut_dp_3_243), "l"(lut_dp_3_81), "l"(lut_dp_3_27), "l"(lut_dp_3_9), "d"(rmem[0].x), "d"(rmem[0].y), "d"(rmem[1].x), "d"(rmem[1].y), "d"(rmem[1].y), "d"(rmem[2].x), "d"(rmem[2].y));
};


#endif
